source: projects/specs/trunk/h/heartbeat/heartbeat-vl.spec @ 3030

Revision 3030, 60.5 KB checked in by Takemikaduchi, 13 years ago (diff)

heartbeat: rebuild with openssl-1.0.0d

Line 
# Build-time feature toggles (1 = on, 0 = off).
# ENABLE_SNMP_SUBAGENT only gates the MIB entry in the main file list.
# ENABLE_MGMT gates the extra build dependencies below, the gettext runtime
# dependency, the mgmt configure switch and the hbmgmt libraries in the file list.
1%define           ENABLE_SNMP_SUBAGENT 0
2%define           ENABLE_MGMT 1
# Numeric id used for BOTH the group (groupadd -g) and the user (useradd -u)
# created in the pre scriptlet, plus the corresponding account names.
3%define           uid 24
4%define           gname haclient
5%define           uname hacluster
6
7Summary:          Heartbeat subsystem for High-Availability Linux
8Summary(ja):      高可用性 Linux のための HeartBeat サブシステム
9Name:             heartbeat
10Version:          2.0.8
11Release:          6%{_dist_release}
12
13Group:            System Environment/Daemons
14License:          GPL/LGPL
15URL:              http://linux-ha.org/
16
17Source0:          http://linux-ha.org/download/%{name}-%{version}.tar.gz
18Patch0:           heartbeat-fedora-pam.patch
19Patch1:           heartbeat-fedora-chkconfig.patch
20
21BuildRoot:        %{_tmppath}/%{name}-%{version}-root
22BuildRequires:    glib2-devel
23BuildRequires:    iputils
24BuildRequires:    libnet-devel
25BuildRequires:    libtool-ltdl-devel
26BuildRequires:    net-snmp-devel
27BuildRequires:    bzip2-devel
28BuildRequires:    ncurses-devel
# Build dependencies needed only when the management daemon is enabled.
29%if %{ENABLE_MGMT}
30BuildRequires:    gnutls-devel > 2
31BuildRequires:    pam-devel
32BuildRequires:    python-devel
33BuildRequires:    swig
34BuildRequires:    curl-devel
35BuildRequires:    libuuid-devel
36BuildRequires:    libxml2-devel
37%endif
# The base package pulls in its own subpackages at exactly this version-release.
38Requires:         stonith = %{version}-%{release}
39Requires:         pils = %{version}-%{release}
40Requires:         ldirectord = %{version}-%{release}
41Requires:         pygtk2 >= 2.4
# chkconfig is invoked from the post and preun scriptlets.
42Requires(post):   /sbin/chkconfig
43Requires(preun):  /sbin/chkconfig
44%if %{ENABLE_MGMT}
45Requires:         gettext
46%endif
47
48%description
49heartbeat is a basic high-availability subsystem for Linux-HA.
50It will run scripts at initialization, and when machines go up or down.
51This version will also perform IP address takeover using gratuitous ARPs.
52It supports "n-node" clusters with significant capabilities for managing
53resources and dependencies.
54
55In addition it continues to support the older release 1 style of
562-node clustering.
57
58It implements the following kinds of heartbeats:
59        - Serial ports
60        - UDP/IP multicast (ethernet, etc)
61        - UDP/IP broadcast (ethernet, etc)
62        - UDP/IP heartbeats
63        - "ping" heartbeats (for routers, switches, etc.)
64           (to be used for breaking ties in 2-node systems)
65
66%package -n ldirectord
# Subpackage named without the base-package prefix (-n).
# The dependency on the base package is pinned to the full version-release,
# matching how the base package and the stonith/devel subpackages pin theirs,
# so mixed releases of the same upstream version cannot be installed together.
67Summary:          Monitor daemon for maintaining high availability resources
68Summary(ja):      高可用リソースを管理するための監視デーモン
69Group:            System Environment/Daemons
70Requires:         ipvsadm
71Requires:         %{name} = %{version}-%{release}
72Requires(post):   /sbin/chkconfig
73Requires(preun):  /sbin/chkconfig
74
75%description -n ldirectord
76ldirectord is a stand-alone daemon to monitor services of real servers
77for virtual services provided by The Linux Virtual Server
78(http://www.linuxvirtualserver.org/). It is simple to install
79and works with the heartbeat code (http://www.linux-ha.org/).
80
81%package -n stonith
# Subpackage named without the base-package prefix (-n); it depends on the
# pils subpackage at exactly the same version-release.
82Summary:        Provides an interface to Shoot The Other Node In The Head
83Group:          System Environment/Daemons
84Requires:       pils = %{version}-%{release}
85
86%description -n stonith
87The STONITH module (a.k.a. STOMITH) provides an extensible interface
88for remotely powering down a node in the cluster.  The idea is quite simple:
89When the software running on one machine wants to make sure another
90machine in the cluster is not using a resource, pull the plug on the other
91machine. It's simple and reliable, albeit admittedly brutal.
92#'
93
94%package -n pils
# Subpackage named without the base-package prefix (-n); it declares no
# explicit dependencies of its own.
95Summary:        Provides a general plugin and interface loading library
96Group:          System Environment/Daemons
97
98%description -n pils
99PILS is a generalized and portable open source Plugin and Interface Loading
100System. PILS was developed as part of the Open Cluster Framework reference
101implementation, and is designed to be directly usable by a wide variety of
102other applications.
103PILS manages both plugins (loadable objects), and the interfaces these plugins
104implement. PILS is designed to support any number of plugins implementing any
105number of interfaces.
106
107%package devel
# Development subpackage (named heartbeat-devel, since no -n is given);
# requires the base package at exactly the same version-release.
108Summary:        Heartbeat development package
109Summary(ja):    Heartbeat 開発パッケージ
110Group:          Development/Libraries
111Requires:       heartbeat = %{version}-%{release}
112
113%description devel
114Heartbeat development package
115
116%prep
# Unpack Source0 quietly, then apply Patch0 (PAM) and Patch1 (chkconfig),
# each with one leading path component stripped.
117%setup -q
118%patch0 -p1
119%patch1 -p1
120 
121%build
# Run configure with the distribution optimisation flags, static libraries
# disabled, and the management daemon switched on or off by ENABLE_MGMT,
# then run a plain (non-parallel) make.
# NOTE: the configure invocation below is one backslash-continued command;
# do not insert comment lines between its continuation lines.
122# disable-fatal-warnings flag used to disable gcc4.x warnings of 'difference in signedness'
123CFLAGS=${RPM_OPT_FLAGS} \
124%configure \
125  --disable-fatal-warnings \
126  --disable-static \
127%if %{ENABLE_MGMT}
128  --enable-mgmt
129%else
130  --disable-mgmt
131%endif
132make
133
134%install
# Start from an empty buildroot and stage the build into it.
135rm -rf $RPM_BUILD_ROOT
136mkdir -p $RPM_BUILD_ROOT
137make DESTDIR=$RPM_BUILD_ROOT install
# Expose ldirectord as a heartbeat resource script; the symlink is packaged
# by the ldirectord subpackage and excluded from the main file list.
138(
139  cd $RPM_BUILD_ROOT/etc/ha.d/resource.d
140  ln -s /usr/sbin/ldirectord ldirectord
141)
142
# Configuration directory listed in the ldirectord file list.
143mkdir -p $RPM_BUILD_ROOT/%{_sysconfdir}/ha.d/conf
144
145# cleanup
146[ -d $RPM_BUILD_ROOT/usr/man ] && rm -rf $RPM_BUILD_ROOT/usr/man
147[ -d $RPM_BUILD_ROOT/usr/share/libtool ] && rm -rf $RPM_BUILD_ROOT/usr/share/libtool
# The pattern is quoted so the shell passes it to find verbatim instead of
# expanding it against .la files that happen to be in the build directory.
148find $RPM_BUILD_ROOT -type f -name '*.la' -exec rm -f {} ';'
149
# These files are sourced rather than executed: add an editor mode line as
# their first line and drop the execute bit.
150sed -i -e '1i# -*-Shell-script-*-' $RPM_BUILD_ROOT/%{_libdir}/heartbeat/ocf-shellfuncs
151sed -i -e '1i# -*-Shell-script-*-' $RPM_BUILD_ROOT/%{_sysconfdir}/ha.d/shellfuncs
152chmod -x $RPM_BUILD_ROOT/%{_libdir}/heartbeat/ocf-shellfuncs
153chmod -x $RPM_BUILD_ROOT/%{_sysconfdir}/ha.d/shellfuncs
154chmod -x $RPM_BUILD_ROOT/%{_libdir}/heartbeat-gui/pymgmt.py
155
156%clean
# Remove the buildroot, but never when the variable is empty or points at "/".
157if [ -n "${RPM_BUILD_ROOT}"  -a "${RPM_BUILD_ROOT}" != "/" ]; then
158  rm -rf $RPM_BUILD_ROOT
159fi
160
161%pre
# Create the cluster group and user with the fixed numeric id from the uid
# macro. The user is a system account (-r) with no home directory created (-M)
# and a nologin shell. Output is discarded and failures are ignored ("|| :"),
# so an already-existing account does not abort the installation.
162/usr/sbin/groupadd -g %{uid} %{gname} &>/dev/null || :
163/usr/sbin/useradd -M -r -u %{uid} -s /sbin/nologin -d /var/lib/heartbeat/cores/hacluster \
164        -c 'heartbeat user' -g %{gname} %{uname} &>/dev/null || :
165
166%post
# Refresh the dynamic linker cache for the shared libraries shipped in this
# package, then register the heartbeat init script with chkconfig.
167/sbin/ldconfig
168/sbin/chkconfig --add heartbeat
169
170%preun
# $1 is the number of instances of this package that will remain after the
# operation. Deregister the init script only on final removal ($1 = 0): on an
# upgrade this scriptlet runs after the new package's post scriptlet, so an
# unconditional --del would drop the registration that was just added.
171test "$1" != 0 || /sbin/chkconfig --del heartbeat
172
173%postun
# Refresh the linker cache, then remove the cluster user and group, but only
# when the last instance of the package is being erased ($1 = 0). Output is
# discarded and failures are ignored.
174/sbin/ldconfig
175test "$1" != 0 || /usr/sbin/userdel  %{uname} &>/dev/null || :
176test "$1" != 0 || /usr/sbin/groupdel %{gname} &>/dev/null || :
177
178%post -n ldirectord
# Register the ldirectord init script with chkconfig.
179/sbin/chkconfig --add ldirectord
180
181%preun -n ldirectord
# $1 is the number of instances of this package that will remain after the
# operation. Deregister the init script only on final removal ($1 = 0) so an
# upgrade does not undo the registration done by the new package's post scriptlet.
182test "$1" != 0 || /sbin/chkconfig --del ldirectord
183
# The two stonith scriptlets below run /sbin/ldconfig directly as the
# scriptlet interpreter (-p) after install and after removal. This comment is
# deliberately kept above the first header: anything placed under a -p header
# would become that scriptlet's body.
184%post -n stonith -p /sbin/ldconfig
185
186%postun -n stonith -p /sbin/ldconfig
187
188%files
# File list of the main heartbeat package.
# The default-attribute line comes first so that every entry below, including
# the documentation directory, is packaged as root:root.
189%defattr(-,root,root)
190%doc %{_datadir}/doc/%{name}-%{version}
191%dir %{_sysconfdir}/ha.d
192%{_sysconfdir}/ha.d/harc
193%config(noreplace) %{_sysconfdir}/ha.d/shellfuncs
194%{_sysconfdir}/ha.d/rc.d
195%config(noreplace) %{_sysconfdir}/ha.d/README.config
196%{_libdir}/heartbeat
197%{_libdir}/heartbeat-gui
198%{_libdir}/libapphb.so.*
199%{_libdir}/libccmclient.so.*
200%{_libdir}/libcib.so.*
201%{_libdir}/libclm.so.*
202%{_libdir}/libcrmcommon.so.*
203%{_libdir}/libtransitioner.so.*
204%{_libdir}/libhbclient.so.*
205%{_libdir}/liblrm.so.*
206%{_libdir}/libpengine.so.*
207%{_libdir}/libplumb.so.*
208%{_libdir}/libplumbgpl.so.*
209%{_libdir}/librecoverymgr.so.*
210%{_libdir}/libstonithd.so.*
211%{_prefix}/lib/ocf
# The whole resource.d directory is packaged here except the ldirectord
# symlink created during install, which belongs to the ldirectord subpackage.
212%{_sysconfdir}/ha.d/resource.d/
213%exclude %{_sysconfdir}/ha.d/resource.d/ldirectord
214%{_sysconfdir}/init.d/heartbeat
215%config(noreplace) %{_sysconfdir}/logrotate.d/heartbeat
# State directories; the per-account directories under cores carry explicit
# ownership, and cores/hacluster is also the home directory given to useradd.
216%dir %{_var}/lib/heartbeat
217%dir %{_var}/lib/heartbeat/cores
218%dir %attr (0755, root, root) %{_var}/lib/heartbeat/cores/root
219%dir %attr (0755, nobody, nobody) %{_var}/lib/heartbeat/cores/nobody
220%dir %attr (0755, hacluster, haclient) %{_var}/lib/heartbeat/cores/hacluster
221%dir %{_var}/run/heartbeat
222%attr (0755, hacluster, haclient) %{_bindir}/cl_status
223%{_bindir}/cl_respawn
224%{_sbindir}/crmadmin
225%{_sbindir}/cibadmin
226%{_sbindir}/ccm_tool
227%{_sbindir}/crm_diff
228%{_sbindir}/crm_uuid
229%{_sbindir}/crm_mon
230%{_sbindir}/crm_sh
231%{_sbindir}/iso8601
232%{_sbindir}/crm_master
233%{_sbindir}/crm_standby
234%{_sbindir}/crm_attribute
235%{_sbindir}/crm_resource
236%{_sbindir}/crm_verify
237%{_sbindir}/attrd_updater
238%{_sbindir}/crm_failcount
239%{_sbindir}/ocf-tester
240%dir %attr (755, hacluster, haclient) %{_var}/run/heartbeat/ccm
241%dir %attr (755, hacluster, haclient) %{_var}/run/heartbeat/crm
242%dir %attr (755, hacluster, haclient) %{_var}/lib/heartbeat/crm
243%dir %attr (755, hacluster, haclient) %{_var}/lib/heartbeat/pengine
244%{_mandir}/man1/cl_status.1*
245%{_mandir}/man1/ha_logger.1*
246%{_mandir}/man1/hb_standby.1*
247%{_mandir}/man1/hb_takeover.1*
248%{_mandir}/man1/hb_addnode.1*
249%{_mandir}/man1/hb_delnode.1*
250%{_mandir}/man8/heartbeat.8*
251%{_mandir}/man8/apphbd.8*
252%{_mandir}/man8/ha_logd.8*
253%{_mandir}/man8/cibadmin.8*
254%{_mandir}/man8/crm_resource.8*
# The two groups below are packaged only when the matching feature toggle at
# the top of the spec is enabled.
255%if %{ENABLE_SNMP_SUBAGENT}
256/LINUX-HA-MIB.mib
257%endif
258%if %{ENABLE_MGMT}
259%{_libdir}/libhbmgmt.so.*
260%{_libdir}/libhbmgmtclient.so.*
261%{_libdir}/libhbmgmtcommon.so.*
262%{_libdir}/libhbmgmttls.so.*
263%config(noreplace) %{_sysconfdir}/pam.d/hbmgmtd
264%{_datadir}/locale/zh_CN/LC_MESSAGES/haclient.mo
265%endif
266
267%files -n ldirectord
# File list of the ldirectord subpackage. The default-attribute line comes
# first so the documentation entries are covered by it as well.
268%defattr(-,root,root)
269%doc doc/COPYING
270%doc doc/README
271%doc ldirectord/ldirectord.cf
# ha.d/conf is created empty during install; resource.d/ldirectord is the
# symlink created there and excluded from the main package.
272%{_sysconfdir}/ha.d/conf
273%{_sbindir}/ldirectord
274%{_sbindir}/supervise-ldirectord-config
275%config(noreplace) %{_sysconfdir}/logrotate.d/ldirectord
276%{_sysconfdir}/init.d/ldirectord
277%{_sysconfdir}/ha.d/resource.d/ldirectord
278%{_mandir}/man8/ldirectord.8*
279%{_mandir}/man8/supervise-ldirectord-config.8*
280
281%files -n stonith
# File list of the stonith subpackage. The default-attribute line comes first
# so the documentation entries are covered by it as well.
282%defattr(-,root,root)
283%doc doc/COPYING
284%doc doc/README
# NOTE(review): this glob matches every versioned shared library in libdir,
# including the ones listed individually in the main package and libpils from
# the pils subpackage, so those files end up owned by more than one package.
# Narrowing it to the stonith library alone looks intended - confirm the
# library name against the build output before changing it.
285%{_libdir}/*.so.*
286%{_libdir}/stonith/
287%{_sbindir}/stonith
288%{_sbindir}/meatclient
289%{_mandir}/man8/stonith.8*
290%{_mandir}/man8/meatclient.8*
291
292%files -n pils
# File list of the pils subpackage. The default-attribute line comes first so
# the documentation entries are covered by it as well, and the header
# directory uses the includedir macro instead of a hard-coded /usr/include.
# NOTE(review): the pils headers are also listed by the devel subpackage, and
# the libpils glob below also matches the unversioned .so that devel picks up
# through its own .so glob - confirm whether this double ownership is wanted.
293%defattr(-,root,root)
294%doc doc/COPYING
295%doc doc/README
296%{_includedir}/pils
297%{_libdir}/libpils.*
298%{_libdir}/pils/
299
300%files devel
# File list of the development subpackage: public headers and the unversioned
# shared-library links. The default-attribute line comes first so the
# documentation directory is covered by it as well.
301%defattr(-,root,root)
302%doc %{_datadir}/doc/%{name}-%{version}
303%{_includedir}/heartbeat/
304%{_includedir}/clplumbing/
305%{_includedir}/saf/
306%{_includedir}/ocf/
307%{_includedir}/stonith/
308%{_includedir}/pils/
309%{_libdir}/*.so
310
311%changelog
312* Sun Mar 20 2011 Yoji TOYODA <bsyamato@sea.plala.or.jp> 2.0.8-6
313- rebuild with openssl-1.0.0d
314- add BuildRequires: libuuid-devel, libxml2-devel
315
316* Sun Oct  3 2010 Ryoichi INAGAKI <ryo1@bc.wakwak.com> 2.0.8-5
317- rebuilt with new toolchain
318
319* Sun May 17 2009 Ryoichi INAGAKI <ryo1@bc.wakwak.com> 2.0.8-4
320- spec in UTF-8
321- changed devel Group to Development/Libraries
322
323* Tue May 05 2009 Satoshi IWAMOTO <satoshi.iwamoto@nifty.ne.jp> 2.0.8-3
324- new versioning policy
325- rebuild with gnutls 2.6.6, libtool 2.2.6 and curl 7.19.4
326- add BuildRequires: curl-devel
327
328* Sun Jan 06 2008 Shu KONNO <owa@bg.wakwak.com> 2.0.8-0vl2
329- rebuilt with net-snmp-5.4.1
330
331* Sat May 19 2007 Daisuke SUZUKI <daisuke@linux.or.jp> 2.0.8-0vl1
332- new upstream release
333- build with new environment
334
335* Mon Oct 30 2006 Daisuke SUZUKI <daisuke@linux.or.jp> 2.0.7-0vl2
336- rebuild with gnutls-1.4
337- add Japanese summaries
338
339* Mon Oct 23 2006 Daisuke SUZUKI <daisuke@linux.or.jp> 2.0.7-0vl1
340- initial build for Vine Linux based on FE package.
341
342* Wed Aug 30 2006 Joost Soeterbroek <fedora@soeterbroek.com> - 2.0.7-2
343- rebuild for Fedora Extras 6
344
345* Wed Aug 16 2006  Joost Soeterbroek <fedora@soeterbroek.com> - 2.0.7-1
346- upstream version 2.0.7
347
348* Sat Jul 15 2006  Joost Soeterbroek <fedora@soeterbroek.com> - 2.0.6-2
349- added BuildReqs: ncurses-devel
350
351* Fri Jul 14 2006  Joost Soeterbroek <fedora@soeterbroek.com> - 2.0.6-1
352- upstream version 2.0.6
353
354* Fri Jun 16 2006  Joost Soeterbroek <fedora@soeterbroek.com> - 2.0.5-2
355- bump for gnutls change in devel
356
357* Thu Apr 27 2006  Joost Soeterbroek <fedora@soeterbroek.com> - 2.0.5-1
358- upstream version 2.0.5
359- removed patch2 - ownership of /heartbeat/crm/cib.xml is no longer
360  set in cts/CM_LinuxHAv2.py.in
361
362* Wed Mar 29 2006  Joost Soeterbroek <fedora@soeterbroek.com> - 2.0.4-2
363- Version 2.0.4
364
365* Wed Mar  1 2006  Joost Soeterbroek <fedora@soeterbroek.com> - 2.0.3-9
366- changed user creation
367- added patch2 heartbeat-2.0.3-fedora-ccmuser.patch 
368
369* Wed Mar  1 2006  Joost Soeterbroek <fedora@soeterbroek.com> - 2.0.3-8
370- specifically excluded ldirectord symlink from heartbeat package
371- removed user and group deletion in postun
372- renamed subpackages ldirectord, pils and stonith to lose prefix heartbeat
373  by using -n
374
375* Tue Feb 28 2006  Joost Soeterbroek <fedora@soeterbroek.com> - 2.0.3-7
376- fixed more rpmlint errors and warnings
377
378* Sat Feb 25 2006  Joost Soeterbroek <fedora@soeterbroek.com> - 2.0.3-6
379- fixed number of rpmlint warnings and errors (still ignores some..)
380- generate 'predictable' uid and gid with fedora-usermgmt to use with
381  configure flag -with-ccmuser-id and groupadd, useradd
382- added Buildreq's: libtool-ltdl-devel, fedora-usermgmt-setup
383  net-snmp-devel, bzip2-devel
384- removed *.so duplication in heartbeat and heartbeat-devel
385- changed file sections
386
387* Fri Feb 24 2006  Joost Soeterbroek <fedora@soeterbroek.com> - 2.0.3-5
388- useradd with fedora-usermgmt
389- added *.so file to -devel sub-package
390
391* Sat Feb 18 2006  Joost Soeterbroek <fedora@soeterbroek.com> - 2.0.3-4
392- removed all perl requires; should be picked up by rpmbuild automagically
393- changed system user creation hacluster part to use baseid:
394  (http://fedoraproject.org/wiki/Packaging/UserCreation)
395
396* Thu Feb 16 2006  Joost Soeterbroek <fedora@soeterbroek.com> - 2.0.3-3
397- removed Requires: python and gnutls
398- changed _libdir/ocf -> _prefix/lib/ocf
399- reversed subpackages depend on basepackage
400- removed Req swig (kept BuildReq)
401- added Req pygtk2
402
403* Wed Feb 15 2006  Joost Soeterbroek <fedora@soeterbroek.com> - 2.0.3-2
404- fixes for various rpmlint errors and warnings
405- fixed setup -q
406- make subpackages depend on basepackage, not reverse
407- clean buildroot at beginning of install
408- replaced a number of hardcoded paths with RPM macros
409- Changed Group from Networking/Daemons to System Environment/Daemons
410- enable mgmt option
411
412* Sun Feb 12 2006  Joost Soeterbroek <fedora@soeterbroek.com> - 2.0.3-1
413- rebuilt for Fedora Extras
414
415* Fri Feb 10 2006  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
416+ Version 2.0.3 - Bug fixes and significant new features.
417  + Management Daemon/Library and GUI client
418    + provide a management library for the management daemon and CIM provider
419    + provide a management daemon and a basic GUI management tool
420  + CIM enablement
421    + CIM (Common Information Model) enablement - works with
422      sblim-sfcb, OpenWBEM, and Pegasus CIMOMs
423    - not yet compiled into our binary RPMs because of dependencies
424  + CRM (Cluster Resource Manager) General
425    + All shutdowns go via the PE/TE - preserves inter-resource ordering
426    + Support for future changes to the CIB (deprecation of cib_fragment)
427    + Overhaul of IPC and HA channel callback logic
428    + Many improvements to the quality and quantity (reduced) of logging
429  + CRMd
430    + Timerless elections - when everyone has voted we're done
431    + Use the replace notification from the CIB to re-update our copy with
432      our view of our peers.
433    + Reliably detect if the LRM connection is still active.
434    + Elections
435      + newer versions defer to older ones in DC elections
436        (opposite of current behavior)
437      + this means that only once the complete cluster has been upgraded will
438        we start acting like the new version and accept new config options
439      + it also means newer PE's and TE's (the most complex pieces) don't need
440        "act like the old version" options and can rely on all slaves being at
441        least as up-to-date as they are
442      + people can run mixed clusters as long as they want
443        (until they want the new PE features)
444      + new DCs only update the version number in the CIB if they have a
445        higher value
446      + nodes that start and have a lower version than that stored in the CIB
447        shut themselves down (the CRM part anyway)
448      + this prevents an admin from introducing old nodes back into an upgraded
449        cluster. It probably doesn't fully understand the config and may not
450        support the actions the PE/TE requires.
451  + CIB (Common Information Base daemon)
452    + Make sure "query only" connections can't modify the CIB
453    + Periodically dump some stats about what the CIB has been doing.
454    + Verify there are no memory leaks
455    + Performance enhancements
456    + Prevent a single CIB client from blocking everyone else
457    + Clients Can be notified of full CIB replacements
458    + record_config_changes option in ha.cf for those worried about
459      the amount of logging.  Defaults to "on".
460    + suppress_cib_writes CIB option replaced with enable_config_writes in ha.cf
461      (enable_config_writes to be removed in 2.0.4)
462    + Never write the status section to disk
463    + Check permissions for the on-disk CIB at startup
464    + Don't trash unreadable on-disk CIBs
465    + Fix for updates made against the whole CIB (not just one section)
466  + PEngine (Policy Engine)
467    + Many improvements to the handling of resource groups
468    + Support "anonymous" clones
469    + Fix stonith ordering
470    + Order DC shutdowns after everyone else's
471    + Support short resource names (for group and clone resources)
472    + The ordering and colocation of grouped resources is now optional
473    + Support probing new nodes for active resources.
474    + All "probe" actions are controlled by the PE.
475      + No resource may be started until the probing is complete.
476      + Do not probe for resources we know to be active on unprobed nodes
477    + When looking for monitor ops, only mark it optional if it was already
478      active on the node we're interested in.
479    + Detect changes to class/type/provider/parameters and force a restart
480      of the resource
481    + New record_pengine_inputs option in ha.cf for those worried about
482      the amount of logging.  Defaults to "on".
483    + Differentiate between config and processing errors
484      + reduces the frequency that we need to log the complete CIB
485    + Make notify for master/slave work
486    + New CIB option: stop_orphan_resources (boolean)
487      If a resource is no longer defined, we can optionally stop it
488    + New CIB option: stop_orphan_actions (boolean)
489      If a monitor op for a given interval is no longer defined, we can
490      optionally stop it
491    + Add support for time and phase-of-the-moon based constraints
492    + Improved failure handling: avoiding false positives
493    + Always create orphaned resources - so they show up in crm_mon
494    + Do not require sequential clone numbers starting at 0
495  + TEngine (transition engine)
496    + Detect old stonith ops
497  + CLIs (Command Line interfaces)
498    + Create a --one-shot option for crm_mon
499    + Switch a number of CLI tools to use the new synchronous connections
500    + Log errors to stderr where they will be seen and therefore useful
501    + Support migration and un-migration of resources and resource groups
502    + Create crm_verify for checking configuration validity
503    + Simplify the passing of XML to cibadmin
504  + Known open bugs worth mentioning:
505    + 1075, 1080, 1081, 1084, 1085, 1064, 1069, 756, 984
506    + 1050, 1082, 1037, 1079
507   
508* Thu Sep 22 2005  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
509+ Version 2.0.2 - small bug fix only release
510  + Fixed a bug in ping directive - it works again
511  + Added a check to BasicSanityCheck to check ping and ping_group directives
512  + fixed cl_status nodestatus to return 0 if a node has status "ping"
513  + fixed a memory leak in the CRM's LRM interface code
514  + fixed code which determines which version of the CRM becomes
515    the DC when basic CIB schema versions differ.  It now prefers
516    the older version to be DC instead of the newer version.
517
518* Wed Sep 14 2005  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
519+ Version 2.0.1 -
520  + Communication Layer
521    + netstring encoding format is changed to be more efficient
522    + add compression capability for big messages
523  + Add man pages for hb_standby/hb_takeover   
524  + The assert triggered by 2.0.0 has been fixed
525  + CIB can now contain XML comments and/or be in DOS format   
526  + Includes implementation of the ISO8601 date format
527  + New CLI tools for changing cluster preferences, node attributes
528    and node standby
529  + Improved recovery and placement of group resources
530  + Detection of failed nodes by the Policy Engine is fixed
531  + New Policy Engine features
532    http://www.linux-ha.org/ClusterResourceManager/DTD1.0/Annotated :
533      sections 1.5.[8,9,10,12]
534    + Constraints and instance attributes can now be active conditionally
535    + Rules can now contain other rules
536    + Date/Time based expressions are supported
537    + Cloned resources can now optionally be notified before and after
538      any of its peers are stopped or started.
539    + The cluster can re-evaluate the configuration automatically after
540      a defined interval of idleness
541  + Removed a flow control message which was very annoying when operating
542    in a mixed 1.x/2.x environment
543  -- Known Bugs :-( --
544    - Bug 859 - FSA took too long to complete action - fully recovered from
545    - Bug 882 - IPC channel not connected during shutdown - harmless
546    - Bug 879 - Failed actions cause extra election - harmless
547 Each of these occurs about once or twice in 5000 test iterations
548       - This is probably > 10K failovers
549    - rsc_location constraints cannot have rules that contain other rules
550      (fixed in CVS after release)
551* Fri Jul 29 2005  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
552+ Version 2.0.0 - First stable release of the next generation of the Linux-HA project
553  + Basic Characteristics described here:
554        http://linux-ha.org/FactSheetv2
555  + Core infrastructure improvements:
556    + Messaging (message acknowledging and flow control)
557    + Logging   (logging daemon)
558  + Release 1.x style (2-node) clusters fully supported
559  + Multi-node support (so far up to 16-node clusters tested)
560        See http://linux-ha.org/GettingStartedV2 for more information
561  + New components:
562    + Cluster Information Base    (replicated resource configuration)
563    + Cluster Resource Manager    (supporting 1->N nodes)
564    + Modular Policy Engine       (controlling resource placement)
565    + Local Resource Manager      (policy free, not cluster aware)
566    + Stonith Daemon              (stand-alone fencing subsystem)
567  + Support for OCF and LSB resource agents
568  + Support for composite resource types (groups, clones)
569  + Support for a rich set of resource location and ordering constraints
570  + Conversion tool for existing haresources
571  + Resources monitored by request
572  + Resource "maintenance" mode
573  + Several failback, failure and "No Quorum" behaviours to choose from
574        (global defaults and per action or resource)
575  + Sample cluster state and configuration monitoring tools
576
577  Known issues in 2.0.0:
578    - Under some rare circumstances the cluster manager will time out
579      while stabilizing a new cluster state.  This appears to be
580        otherwise harmless - the cluster is actually fine.
581        http://www.osdl.org/developer_bugzilla/show_bug.cgi?id=770
582    - Under some rare circumstances, a dev assert will be triggered
583        in unpack.c.  This results in the pengine getting restarted.
584        This is annoying, but not a disaster.
585        http://www.osdl.org/developer_bugzilla/show_bug.cgi?id=797
586
587* Tue May 23 2005  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
588+ Version 1.99.5 - Near-final beta of 2.0.0 release
589  + many bug fixes - code looks very stable at this point
590    -- well tested at this point on 4 and 8 node clusters.
591
592* Thu Apr 07 2005  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
593+ Version 1.99.4 - Near-final beta of 2.0.0 release
594  + many bug fixes since 1.99.1
595  + new external STONITH model - fully supports scripting interface
596  + tested through 12 node clusters successfully
597  + No serious defects found in testing
598  + Easier-to-understand locational constraints model
599  + Many bug fixes of many kinds
600  + Important bug fixes to OCF IPaddr resource agent
601  + Resources are monitored only on request
602  + See http://wiki.linux-ha.org/ClusterResourceManager/Setup
603    for basic ideas about getting started.
604  + Release 1 style (2-node) clusters still fully supported
605  + Release 2 style clusters support 1-N node clusters
606        (where N is probably something like 8-32)
607
608* Tue Mar 20 2005  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
609+ Version 1.99.3 - Near-final beta "technology preview" of 2.0.0 release
610  + many bug fixes since 1.99.1
611  + tested through 12 node clusters with reasonable success
612  + new STONITH API
613
614* Sun Feb 20 2005  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
615+ Version 1.99.2 - Near-final beta "technology preview" of 2.0.0 release
616  + Many many many changes.  Far too many to describe here.
617  + See http://wiki.linux-ha.org/ClusterResourceManager/Setup
618    for certain basic ideas about getting started.
619
620* Mon Oct 11 2004  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
621+ Version 1.99.1 - *early* beta series - preparing for 2.0.0
622  + Andrew provided a number of fixes to the CRM and 2.0 features
623  + Fixed a problem with retrying failed STONITH operations
624
625* Mon Oct 11 2004  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
626+ Version 1.99.0 - *early* beta series - preparing for 2.0.0
627  + All STABLE changes noted below have been ported to this branch
628  + Included in this release is a beta of the next generation of Heartbeat
629        resource manager developed by Andrew Beekhof. 
630        http://linuxha.trick.ca/NewHeartbeatDesign is a good place to learn
631        more about this effort. Please examine crm/README, crm/test/README
632        and crm/crm-1.0.dtd for example usage and configuration.
633  + Also included is the L(ocal) R(esource) M(anager) developed by IBM China
634        which is an integral part of the NewHeartbeatDesign.
635  + Known caveats:
636    - STONITH as a whole has seen a code cleanup and should be tested
637      carefully.
638    - The external STONITH plug-in has undergone major surgery and
639      probably doesn't work yet.
640    - the new CRM is not perfectly stable with 3 nodes yet.
641  + PLEASE see http://osdl.org/developer_bugzilla/enter_bug.cgi?product=Linux-HA
642    and use it to report quirks and issues you find!
643 
644* Sat Sep 18 2004  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
645+ Version 1.2.3 (stable)
646  + fixed a serious error which causes heartbeat to misbehave after about
647        10 months of continuous operation
648  + Made our ARP packets more RFC compliant
649  + Extended apcmastersnmp code to deal with new devices
650  + fixed a bug concerning simultaneous stops of both machines causing one
651        of them to not shut down.
652  + added an option to suppress reporting on packet corruption
653  + fixed it so that we don't create the FIFO by the RPM
654  + made cl_status setgid so anyone can run it, and fixed exit codes
655  + eliminated a serious memory leak associated with client code
656  + packaged doc files which had been missed before
657  + fixed many many small bugs and memory leaks detected by BEAM
658  + added several new test cases
659  + fixed longstanding bug in plugin unloading
660  + fixed a shutdown hang problem
661  + several fixes for Solaris, FreeBSD
662  + Solaris packaging now included in base
663  + fixed a bug related to the apache resource agent not handling
664        quoted parameters
665  + added use_apphbd parameter to have heartbeat register
666        with apphbd instead of watchdog device when desired
667  + changed apphbd to default its config file to /etc
668  + added snmp subagent code
669  + added hbaping communications plugin
670  + added external STONITH plugin
671  + ldirectord: fixed a bug where real servers that are
672        present in multiple virtual services will only be added
673        to one virtual service.
674
675* Mon May 11 2004  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
676+ Version 1.2.2 (stable)
677  + Fixed several format string errors in communication plugins
678  + Fixed a bug which kept us from diagnosing errors in non-aliased interfaces
679  + Fixed a bug in ipaddr which caused an infinite loop when auto_failback on
680  + Updated Debian things...
681  + Added IPv6addr resource agent
682  + Added ibmhmc STONITH plugin
683  + Added cl_status command
684  + Fixed a bug regarding restarts when auto_failback is on...
685  + Fixed a couple of bugs in sha1 authentication method for very long keys
686  + Fixed a bug in the portblock resource agent so that it no longer blocks
687          ports on the loopback interface
688  + Increased the time allowed for split brain test before it declares failure
689
690+ Version 1.2.1 (stable)
691  + Netstrings can now be used for our on-the-wire data format
692  + Perl/SWIG bindings added for some heartbeat libraries
693  + Significant improvements to SAF data checkpointing API
694  + Implemented unbuffered ipcsocket code for SAF APIs
695  + Many Solaris fixes -- except for ipfail, Solaris works
696  + Significant library restructuring
697  + Watchdog device NOWAYOUT is now overridden if defaulted
698  + Watchdog device now kills machine instantly after deadtime
699        instead of after one minute
700  + Hostnames should now be treated case-independently...
701  + Added new client status APIs - client_status() and cstatus_callback()
702  + Fixed bug with auto_failback and quick full restarts
703  + We now automatically reboot when resources fail to stop correctly...
704  + We now check the status of the configured STONITH device hourly...
705  + STONITH operations repeat after a 5 second delay, not immediately...
706  + Added hb_takeover command - complement to hb_standby
707  + Added documentation on how to use evlog/TCP to enable testing to
708        take place without losing messages due to UDP message forwarding
709  + Several new tests from Mi, Jun - split brain, bandwidth, failure
710        detection time.
711  + Fix to LVM resource from Harald Milz <hm@muc.de>
712  + Fixed FreeBSD authentication problems breaking ipfail
713  + Fixed .so loading on Debian
714  + Fixed false complaints about resource scripts (from Jens Schmalzing)
715  + Fixed false stop failure from LinuxSCSI  (from Jens Schmalzing <j.s@lmu.de>)
716
717
718
719* Thu Apr 15 2004  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
720+ Version 1.3.0 - beta series
721  + Netstrings can now be used for our on-the-wire data format
722  + Perl/SWIG bindings added for some heartbeat libraries
723  + Significant improvements to SAF data checkpointing API
724  + Implemented unbuffered ipcsocket code for SAF APIs
725  + Many Solaris fixes -- except for ipfail, Solaris works
726  + Significant library restructuring
727  + Watchdog device NOWAYOUT is now overridden if defaulted
728  + Watchdog device now kills machine instantly after deadtime
729        instead of after one minute
730  + Hostnames should now be treated case-independently...
731  + Added new client status APIs - client_status() and cstatus_callback()
732  + Fixed bug with auto_failback and quick full restarts
733  + We now automatically reboot when resources fail to stop correctly...
734  + We now check the status of the configured STONITH device hourly...
735  + STONITH operations repeat after a 5 second delay, not immediately...
736  + Added hb_takeover command - complement to hb_standby
737  + Added documentation on how to use evlog/TCP to enable testing to
738        take place without losing messages due to UDP message forwarding
739  + Several new tests from Mi, Jun - split brain, bandwidth, failure
740        detection time.
741  + Fix to LVM resource from Harald Milz <hm@muc.de>
742
743* Mon Feb 16 2004  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
744+ Version 1.2.0
745  + Replaced the nice_failback option with the auto_failback option.
746        THIS OBSOLETES THE NICE_FAILBACK OPTION. READ THE DOCS FOR HOW
747        TO UPGRADE SMOOTHLY.
748  + Added a new feature to hb_standby which allows you to give up
749          any specific category of resources:  local, foreign, or all.
750        The old behavior is "all" which is the default.
751        This allows you to put an "auto_failback no" cluster into
752          an active/active configuration on demand.
753  + ipfail now works properly with auto_failback on (active/active)
754  + ipfail now has "hysteresis" so that it doesn't respond immediately
755        to a network failure, but waits a little while so that the
756        damage can be properly assessed and extraneous takeovers avoided
757  + Added new ping node timeout directive "deadping"
758  + Made sure heartbeat preallocated stack and heap, and printed a
759        message if we allocate heap once we're started up...
760  + IPMILan STONITH plugin added to CVS
761  + Added IPaddr2 resource script
762  + Made the APC smart UPS ups code compatible with more UPSes
763  + Added a (preliminary?) ordered messaging facility from Yi Zhu
764  + Changed IPaddr's method of doing ARPs in background so that
765        certain timing windows were closed.
766  + Added OCF (wrapper) resource script
767  + Allow respawn programs to take arguments
768  + Added pinggroups (where any node being up is OK)
769  + SIGNIFICANT amount of internal rearchitecture.
770  + Many bug fixes.
771  + Several documentation updates.
772
773* Tue Feb 10 2004  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
774+ Version 1.1.5
775  + ipfail now has "hysteresis" so that it doesn't respond immediately
776        to a network failure, but waits a little while so that the
777        damage can be properly assessed and extraneous takeovers avoided
778  + Several fixes to cl_poll()
779  + More fixes to the IPC code - especially handling data reception
780        after EOF
781  + removed some unclean code from GSource for treating EOF conditions
782  + Several bugs concerning hanging when shutting down early during startup
783  + A few BasicSanityCheck bug fixes
784  + CTS now allows a single machine to be able to monitor several clusters
785  + Most former CTS options are now either unneeded or on the command line
786  + Increased number of ARPs and how long they're being sent out
787  + Fixed uncommon (authorization) memory leak
788  + Some Solaris portability fixes.
789  + Made init script handle standby correctly for new config files
790  + Improved the fast failure detection test
791  + Added some backwards compatibility for nice_failback and some default
792        authentication directives
793  + Corrected the 1.1.4 change log
794 
795
796* Thu Jan 22 2004  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
797+ Version 1.1.4
798  + ipfail now works properly with auto_failback on (active/active)
799  + Changed the API to use sockets (IPC library) instead of FIFOs.
800  + Added new apiauth directives to provide authorization information
801        formerly provided by the FIFO permissions.
802  + Added Intel's implementation of the SAF data checkpointing API and daemon
803  + Added a cleanup suggested by Emily Ratliff.
804  + IPMILan STONITH plugin added to CVS
805  + Added IPaddr2 resource script
806  + Various cleanups due to horms.
807  + Fixed authentication to work on 64-bit platforms(!)
808  + Fixed the cl_poll() code to handle corner cases better
809  + Made heartbeat close watchdog device before re-execing itself
810  + New CTS improvements from Mi, Jun <jun.mi@intel.com>
811  + Various minor bug fixes.
812      . Several shutdown bugs addressed
813      . fixed sendarp to make a pid file, so we can shut it down
814          when we shut everything else down in case it's still running.
815      . Lots of minor bug fixes to IPC code
816      . Lots of minor bug fixes to ipctest program
817      . made BasicSanityCheck more tolerant of delays
818      . Fixed IPC code to authenticate based on ints, not int*s.
819      . Check properly for strnlen instead of strlen...
820      . Several signed/unsigned fixes
821      . A few uninitialized vars now are inited
822      . Switched to compiling lex/yacc sources the automake way
823      . Lots of minor CTS fixes...
824
825  + ldirectord bug fixes:
826    . When new real servers are added on initialisation or when
827        the configuration file is reread they are marked with status
828        of -1 (uninitialised) so they will be checked and inserted
829        into the virtual service as required
830    . All checks use the checkport if set, otherwise the port set for
831        the individual real server. This was the case for http and
832        connect checks, but others had variations on this theme.
833    . When the configuration file is reread because it changed
834        on disk and autoreload is set, check the real servers
835        immediately rather than waiting for checkinterval to expire
836    . Already running message sent to stderr instead of stdout
837    . Support alternate server in real-server specific URL
838    . Treat the same real server with different weights as a different
839        real server. Fixes bug reported by Philip Hayward whereby the same
840        real-server would always have the same weight, regardless of
841        the ldirectord.cf
842
843* Fri Sep 26 2003  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
844+ Version 1.1.3
845  + Bugfix for heartbeat starting resources twice concurrently if
846    auto_failback was set to "legacy".
847  + Bugfix for messages getting lost if messages were sent in quick
848    succession. (Kurosawa Takahiro)
849  + Bugfix for Filesystem resource checking for presence of filesystem
850    support before loading the module.
851  + BasicSanityCheck extended to cover more basic tests.
852  + Bugfix for findif not working correctly for CIDR netmasks.
853  + Minor bugfix for ldirectord recognizing new schedulers correctly and
854    timeout settings are now being honoured.
855  + Enhanced the message giving a better explanation of how to set up node
856    names properly when current node not found in the ha.cf file
857  + Send a message to the cluster whenever we have a node which doesn't
858    need STONITHing - even though it's gone down.  This fix needed
859    by CCM, which is in turn needed by EVMS.
860  + Enhanced the messages for missing ha.cf and missing haresources files
861    explaining that sample config files are found in the documentation.
862  + Fix for memory leak from Forrest Zhao<forrest.zhao@intel.com>
863  + Added a (preliminary?) ordered messaging facility from Yi Zhu
864  + FAQ updates
865  + Added Xinetd resource script
866  + Added OCF (wrapper) resource script
867  + Allow respawn programs to take arguments
868  + Added pinggroups (where any node being up is OK)
869  + fixed ldirectord negotiatetimeout for HTTP
870  + fixed a bug which caused -d flag to be ignored
871  + failing resource scripts are now ERRORs not WARNings
872  + now shuts down correctly when auto_failback == legacy
873
874
875* Sun Jul 13 2003  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
876+ Version 1.1.2
877  + Replaced the nice_failback option with the auto_failback option.
878        THIS OBSOLETES THE NICE_FAILBACK OPTION. READ THE DOCS FOR HOW
879        TO UPGRADE SMOOTHLY.
880  + Changed IPaddr to not do ARPs in background, and shortened time
881        between ARPs.  Also made these things tunable...
882  + changed our comm ttys to not become our controlling TTYs
883  + Enhanced the ServeRAID script to fix a critical bug by using a new feature
884  + Added a new DirectoryMap to CVS - tells where everything is...
885  + significantly enhanced the BasicSanityCheck script, and the tests
886        it calls.
887  + added a new option to use a replacement poll function for improved
888        real-time performance.
889  + added the ability to have a cluster node's name be different
890        from its uname -n
891  + Moved where CTS gets installed to /usr/lib/heartbeat/cts
892  + Big improvements to the CTS README from IBM test labs in Austin.
893  + bug fixes to the WTI NPS power switch
894  + new client API calls:
895        return arbitrary configuration parameters
896        return current resource status
897  + Added a new clplumbing function: mssleep()
898  + added new capabilities for supporting pseudo-resources
899  + added new messages which come out after initial takeover is done
900         (improves CTS results)
901  + LOTS of documentation updates.
902  + fixed a security vulnerability
903  + fixed a bug where heartbeat would shut down while in the middle
904        of processing resource movement requests.
905  + changed compilation flags to eliminate similar future security
906        issues
907  + went to even-more-strict gcc flags
908  + fixed several "reload" bugs.  Now reload works ;-)
909  + fixed STONITH bug when other node never heard from.
910  + Minor bug fixes (cleaned up corrupted message)
911  + Two different client API bugs fixed.
912  + changed the configure script to test which warning flags are
913        supported by the current gcc.
914  + enhanced the API test program to test new capabilities...
915
916
917* Wed May 21 2003  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
918+ Version 1.1.1
919  + Significant restructuring of the processes in heartbeat
920  + Added a new feature to hb_standby which allows you to give up
921          any specific category of resources:  local, foreign, or all.
922        The old behavior is "all" which is the default.
923        This allows you to put a nice_failback cluster into
924          an active/active configuration
925  + Enhancements to the ServeRAID code to make it work with the new
926    (supported) version of IPSSEND from the ServeRAID folks...
927  + Added STONITH code for the Dell remote access controller
928  + Fixed a major bug which kept it from taking over correctly after 246
929        days or so
930  + Fixed a major bug where heartbeat didn't lock itself into memory
931        properly
932  + Added new ping node timeout directive "deadping"
933  + Made sure heartbeat preallocated stack and heap, and printed a
934        message if we allocate heap once we're started up...
935  + Minor heartbeat API bug fixes
936  + Minor documentation fixes
937  + Minor fix to allow IP addresses with /32 masks...
938  + Fixed a timing window for !nice_failback resource acquisition
939  + Added several CCM bug fixes
940  + Made the APC smart UPS ups code compatible with more UPSes
941  + Fixed a bug in respawn
942  + Enhanced internal checking for malloc errors...
943  + Added IP alias search optimization from Sean Reifschneider
944
945* Wed Mar 19 2003  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
946+ Version 1.0.2:
947  + Fixed comment errors in heartbeat init script to allow it to run on RH 8.0
948  + Changed apphbd to use poll(2) instead of sigtimedwait(2)
949  + Put missing files into tarball
950  + Documentation improvements for IPaddr and other things
951  + Fixed an error in hb_standby which kept it from working if releasing
952    resources takes more than 10 seconds
953  + Added a fix to allow heartbeat to run on systems without writable disk
954    (like routers booting from CD-ROM)
955  + Added configuration file for apphbd
956  + Added fix from Adam Li to keep recoverymgr from looping at high priority
957  + Added fix to ServeRAID resource to make it work with (new) supported
958    hardware
959  + Added Delay resource script
960  + Added fix to Filesystem to allow it to support NFS mounts and allow
961    user to specify mount options
962  + Added fix to IPaddr to make tmp directory for restoring loopback device
963  + Added fix to ipcsocket code to deal correctly with EAGAIN when sending
964    message body
965
966* Mon Feb 17 2003  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
967+ Version 1.0.1:
968  + Fixed some compile errors on different platforms, and library versions
969  + Disable ccm from running on 'ping' nodes
970  + Put in Steve Snodgrass' fix to send_arp to make it work on non-primary
971        interfaces.
972
973* Thu Feb 13 2003  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
974+ Version 1.0.1 beta series
975
976  0.4.9g:
977  + Changed default deadtime, warntime, and heartbeat interval
978  + Auto* tool updates
979  + VIP loopback fixes for IP address takeover
980  + Various Solaris and FreeBSD fixes
981  + added SNMP agent
982  + Several CCM bug fixes
983  + two new heartbeat API calls
984  + various documentation fixes, including documentation for ipfail
985  + Numerous minor cleanups.
986  + Fixed a few bugs in the IPC code.
987  + Fixed the (IPC) bug which caused apphbd to hang the whole machine.
988  + Added a new IPC call (waitout)
989  + Wrote a simple IPC test program.
990  + Clarified several log messages.
991  + Cleaned up the ucast communications plugin
992  + Cleaned up for new C compilers
993  + Fixed permissions bug in IPC which caused apphbd to not be usable by all
994  + Added a new rtprio option to the heartbeat config file
995  + updated apphbtest program
996  + Changed ipfail to log things at same level heartbeat does
997
998
999* Sat Nov 30 2002  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
1000+ Version 0.5 beta series (now renamed to 1.0.1 beta series).
1001  0.4.9f:
1002  + Added pre-start, post-start, pre-stop and post-stop constructs in init script
1003  + various IPC fixes
1004  + Fix to STONITH behavior: STONITH unresponsive node right after we reboot
1005  + Fixed extreme latency in IPC code
1006  + various configure.in cleanups
1007  + Fixed memory leak in IPC socket code
1008  + Added streamlined mainloop/IPC integration code
1009  + Moved more heartbeat internal communication to IPC library
1010  + Added further support for ipfail
1011  + Added supplementary groups to the respawn-ed clients
1012  + Added standby to init script actions
1013  + Lots of minor CCM fixes
1014  + Split (most) resource management code into a separate file.
1015  + Fixes to accommodate different versions of libraries
1016  + Heartbeat API client headers fixup
1017  + Added new API calls
1018  + Simplified (and fixed) handling of local status.  This would sometimes cause
1019        obscure failures on startup.
1020  + Added new IPsrcaddr resource script
1021
1022  KNOWN BUGS:
1023  + apphbd goes into an infinite loop on some platforms
1024
1025* Wed Oct 9 2002  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
1026  0.4.9e:
1027  + Changed client code to keep write file descriptor open at all times
1028        (realtime improvement)
1029  + Added a "poll replacement"  function based on sigtimedwait(2), which
1030        should be faster for those cases that can use it.
1031  + Added a hb_warntime() call to the application heartbeat API.
1032  + Changed all times in the configuration file to be in milliseconds
1033        if specified with "ms" at the end.  (seconds is still the default).
1034  + Fixes to serious security issue due to Nathan Wallwork <nwallwo@pnm.com>
1035  + Changed read/write child processes to run as nobody.
1036  + Fixed a bug where ping packets are printed incorrectly when debugging.
1037  + Changed heartbeat code to preallocate some heap space.
1038  + CCM daemon API restructuring
1039  + Added ipc_channel_pair() function to the IPC library.
1040  + Changed everything to use longclock_t instead of clock_t
1041  + Fixed a bug concerning the ifwalk() call on ping nodes in the API
1042  + Made apphbd run at high priority and locked into memory
1043  + Made a library for setting priority up.
1044  + Made ucast comm module at least be configurable and loadable.
1045  + Fixed a startup/shutdown timing problem.
1046
1047  0.4.9d:
1048  + removed an "open" call for /proc/loadavg (improve realtime behavior)
1049  + changed API code to not do 1-char reads from clients
1050  + Ignored certain error conditions from API clients
1051  + fixed an obscure error message about trying to retransmit a packet
1052        which we haven't sent yet.  This happens after restarts.
1053  + made the PILS libraries available in a separate package
1054  + moved the stonith headers to stonith/... when installed
1055  + improved debugging for NV failure cases...
1056  + updated AUTHORS file and simplified the changelog authorship
1057        (look in AUTHORS for the real story)
1058  + Added Ram Pai's CCM membership code
1059  + Added the application heartbeat code
1060  + Added Kevin Dwyer's ipfail client code to the distribution
1061  + Many fixes for various tool versions and OS combinations.
1062  + Fixed a few bugs related to clients disconnecting.
1063  + Fixed some bugs in the CTS test code.
1064  + Added BasicSanityCheck script to tell if built objects look good.
1065  + Added PATH-like capabilities to PILS
1066  + Changed STONITH to use the new plugin system.
1067  + *Significantly* improved STONITH usage message (from Lorn Kay)
1068  + Fixed some bugs related to restarting.
1069  + Made exit codes more LSB-compliant.
1070  + Fixed various things so that ping nodes don't break takeovers.
1071
1072  0.4.9c and before:
1073  + Cluster partitioning  now handled correctly (really!)
1074  + Complete rearchitecture of plugin system
1075  + Complete restructure of build system to use automake and port things
1076        to AIX, FreeBSD and Solaris.
1077  + Added Lclaudio's "standby" capability to put a node into standby
1078        mode on demand.
1079  + Added code to send out gratuitous ARP requests as well as gratuitous
1080        arp replies during IP address takeover.
1081  + Suppress stonith operations for nodes which went down gracefully.
1082  + Significantly improved real-time performance
1083  + Added new unicast heartbeat type.
1084  + Added code to make serial ports flush stale data on new connections.
1085  + The Famous CLK_TCK compile time fixes (really!)
1086  + Added a document which describes the heartbeat API
1087  + Changed the code which makes FIFOs to not try and make the FIFOs for
1088        named clients, and several other minor API client changes.
1089  + Fixed a fairly rare client API bug where it would shut down the
1090        client for no apparent reason.
1091  + Added stonith plugins for: apcmaster, apcmastersnmp switches, and ssh
1092        module (for test environments only)
1093  + Integrated support for the Baytech RPC-3 switch into baytech module
1094  + Fixes to APC UPS plugin
1095  + Got rid of "control_process: NULL message" message
1096  + Got rid of the "controlfifo2msg: cannot create message" message
1097  + Added -h option to give usage message for stonith command...
1098  + Wait for successful STONITH completion, and retry if it's configured.
1099  + Sped up takeover code.
1100  + Several potential timing problems eliminated.
1101  + Cleaned up the shutdown (exit) code considerably.
1102  + Detect the death of our core child processes.
1103  + Changed where usage messages go depending on exit status from usage().
1104  + Made some more functions static.
1105  + Real-time performance improvement changes
1106  + Updated the faqntips document
1107  + Added a feature to heartbeat.h so that log messages get checked as
1108        printf-style messages on GNU C compilers
1109  + Changed several log messages to have the right parameters (discovered
1110        as a result of the change above)
1111  + Numerous FreeBSD, Solaris and OpenBSD fixes.
1112  + Added backwards compatibility kludge for udp (versus bcast)
1113  + Queued messages to API clients instead of throwing them away.
1114  + Added code to send out messages when clients join, leave.
1115  + Added support for spawning and monitoring child clients.
1116  + Cleaned up error messages.
1117  + Added support for DB2, ServeRAID and WAS, LVM, and Apache (IBMhttp too),
1118    also ICP Vortex controller.
1119  + Added locking when creating new IP aliases.
1120  + Added a "unicast" media option.
1121  + Added a new SimulStart and standby test case.
1122  + Diddled init levels around...
1123  + Added an application-level heartbeat API.
1124  + Added several new "plumbing" subsystems (IPC, longclock_t, proctrack, etc.)
1125  + Added a new "contrib" directory.
1126  + Fixed serious (but trivial) bug in the process tracking code which caused
1127        it to exit heartbeat - this occurred repeatably for STONITH operations.
1128  + Write a 'v' to the watchdog device to tell it not to reboot us when
1129        we close the device.
1130  + Various ldirectord fixes due to Horms
1131  + Minor patch from Lorn Kay to deal with loopback interfaces which might
1132        have been put in by LVS direct routing
1133  + Updated AUTHORS file and moved list of authors over
1134
1135* Fri Mar 16 2001  Alan Robertson <alanr@unix.sh>
1136+ Version 0.4.9
1137
1138  + Split into 3 rpms - heartbeat, heartbeat-stonith, and heartbeat-ldirectord
1139
1140  + Made media modules and authentication modules and stonith modules
1141        dynamically loadable.
1142
1143  + Added Multicast media support
1144  + Added ping node/membership/link type for tiebreaking.  This will
1145        be useful when implementing quorum on 2-node systems.
1146        (not yet compatible with nice_failback(?))
1147  + Removed ppp support
1148
1149  + Heartbeat client API support
1150
1151  + Added STONITH API library
1152    +   support for the Baytech RPC-3A power switch
1153    +   support for the APCsmart UPS
1154    +   support for the VACM cluster management tool
1155    +   support for WTI RPS10
1156    +   support for Night/Ware RPC100S
1157    +   support for "Meatware" (human intervention) module
1158    +   support for "null" (testing only) module
1159
1160  + Fixed startup timing bugs
1161  + Fixed shutdown sequence bugs: takeover occurred before
1162        resources were released by other system
1163  + Fixed various logging bugs
1164  + Closed holes in protection against replay attacks
1165
1166  + Added checks that complain if all resources aren't idle on startup.
1167  + IP address takeover fixes
1168      + Endian fixes
1169      + Removed the 8-alias limitation
1170      + Takeovers now occur faster (ARPs occur asynchronously)
1171
1172  + Port number changes
1173    + Use our IANA port number (694) by default
1174    + Recognize our IANA port number ("ha-cluster") if it's in /etc/services
1175
1176  + Moved several files, etc. from /var/run to /var/lib/heartbeat
1177  + Incorporated new ldirectord version
1178  + Added late heartbeat warning for late-arriving heartbeats
1179  + Added detection of and partial recovery from cluster partitions
1180  + Accept multiple arguments for resource scripts
1181  + Added Raid1 and Filesystem resource scripts
1182  + Added man pages
1183  + Added debian package support
1184
1185* Fri Jun 30 2000 Alan Robertson <alanr@unix.sh>
1186+ Version 0.4.8
1187  + Incorporated ldirectord version 1.9 (fixes memory leak)
1188  + Made the order of resource takeover more rational:  Takeover is now
1189    left-to-right, and giveup is right-to-left
1190  + Changed the default port number to our official IANA port number (694)
1191  + Regularized more messages, eliminated some redundant ones.
1192  + Print the version of heartbeat when starting.
1193  + Print exhaustive version info when starting with debug on.
1194  + Hosts now have 3 statuses {down, up, active} active means that it knows
1195        that all its links are operational, and it's safe to send cluster
1196        messages
1197  + Significant revisions to nice_failback (mainly due to lclaudio)
1198  + More SuSE-compatibility. Thanks to Friedrich Lobenstock <fl@fl.priv.at>
1199  + Tidied up logging so it can be to files, to syslog or both (Horms)
1200  + Tidied up build process (Horms)
1201  + Updated ldirectord to produce and install a man page and be
1202    compatible with the fwmark options to The Linux Virtual Server (Horms)
1203  + Added log rotation for ldirectord and heartbeat using logrotate
1204    if it is installed
1205  + Added Audible Alarm resource by Kirk Lawson <lklawson@heapy.com>
1206    and myself (Horms)
1207  + Added init script for ldirectord so it can be run independently
1208    of heartbeat (Horms)
1209  + Added sample config file for ldirectord (Horms)
1210  + An empty /etc/ha.d/conf/ is now part of the rpm distribution
1211    as this is where ldirectord's configuration belongs (Horms)
1212  + Minor startup script tweaks.  Hopefully, we should be able to make core
1213    files should we crash in the future.  Thanks to Holger Kiehl for diagnosing
1214    the problem!
1215  + Fixed a bug which kept the "logfile" option from ever working.
1216  + Added a TestCluster test utility.  Pretty primitive so far...
1217  + Fixed the serial locking code so that it unlocks when it shuts down.
1218  + Lock heartbeat into memory, and raise our priority
1219  + Minor, but important fix from lclaudio to init uninited variable.
1220
1221* Sat Dec 25 1999 Alan Robertson <alanr@unix.sh>
1222+ Version 0.4.7
1223  + Added the nice_failback feature. If the cluster is running when
1224        the primary starts it acts as a secondary. (Luis Claudio Goncalves)
1225  + Put in lots of code to make lost packet retransmission happen
1226  + Stopped trying to use the /proc/ha interface
1227  + Finished the error recovery in the heartbeat protocol (and got it to work)
1228  + Added test code for the heartbeat protocol
1229  + Raised the maximum length of a node name
1230  + Added Jacob Rief's ldirectord resource type
1231  + Added Stefan Salzer's <salt@cin.de> fix for a 'grep' in IPaddr which
1232        wasn't specific enough and would sometimes get IPaddr confused on
1233        IP addresses that prefix-matched.
1234  + Added Lars Marowsky-Bree's suggestion to make the code almost completely
1235        robust with respect to jumping the clock backwards and forwards
1236  + Added code from Michael Moerz <mike@cubit.at> to keep findif from
1237        core dumping if /proc/route can't be read.
1238
1239* Mon Nov 22 1999 Alan Robertson <alanr@unix.sh>
1240+ Version 0.4.6
1241  + Fixed timing problem in "heartbeat restart" so it's reliable now
1242  + Made start/stop status compatible with SuSE expectations
1243  + Made resource status detection compatible with SuSE start/stop expectations
1244  + Fixed a bug relating to serial and ppp-udp authentication (it never worked)
1245  + added a little more substance to the error recovery for the HB protocol.
1246  + Fixed a bug for logging from shell scripts
1247  + Added a little logging for initial resource acquisition
1248  + Added #!/bin/sh to the front of shell scripts
1249  + Fixed Makefile, so that the build root wasn't compiled into pathnames
1250  + Turned on CTSRTS, enabling flow control for serial ports.
1251  + Fixed a bug which kept it from working in non-English environments
1252
1253* Wed Oct 13 1999 Alan Robertson <alanr@unix.sh>
1254+ Version 0.4.5
1255  + Mitja Sarp added a new feature to authenticate heartbeat packets
1256        using a variety of strong authentication techniques
1257  + Changed resource acquisition and relinquishment to occur in heartbeat,
1258       instead of in the start/stop script.  This means you don't *really*
1259       have to use the start/stop script if you don't want to.
1260  + Added -k option to gracefully shut down current heartbeat instance
1261  + Added -r option to cause currently running heartbeat to reread config files
1262  + Added -s option to report on operational status of "heartbeat"
1263  + Sped up resource acquisition on master restart.
1264  + Added validation of ipresources file at startup time.
1265  + Added code to allow the IPaddr takeover script to be given the
1266        interface to take over, instead of inferring it.  This was requested
1267        by Lars Marowsky-Bree
1268  + Incorporated patch from Guenther Thomsen to implement locking for
1269        serial ports used for heartbeats
1270  + Incorporated patch from Guenther Thomsen to clean up logging.
1271        (you can now use syslog and/or file logs)
1272  + Improved FreeBSD compatibility.
1273  + Fixed a bug where the FIFO doesn't get created correctly.
1274  + Fixed a couple of uninitialized variables in heartbeat and /proc/ha code
1275  + Fixed longstanding crash bug related to getting a SIGALRM while in malloc
1276        or free.
1277  + Implemented new memory management scheme, including memory stats
1278
1279* Thu Sep 16 1999 Alan Robertson <alanr@unix.sh>
1280+ Version 0.4.4
1281  + Fixed a stupid error in handling CIDR addresses in IPaddr.
1282  + Updated the documentation with the latest from Rudy.
1283
1284* Wed Sep 15 1999 Alan Robertson <alanr@unix.sh>
1285+ Version 0.4.3
1286  + Changed startup scripts to create /dev/watchdog if needed
1287  + Turned off loading of /proc/ha module by default.
1288  + Incorporated bug fix from Thomas Hepper <th@ant.han.de> to IPaddr for
1289        PPP configurations
1290  + Put in a fix from Gregor Howey <ghowey@bremer-nachrichten.de>
1291        where Gregor found that I had stripped off the ::resourceid part
1292        of the string in ResourceManager resulting in some bad calls later on.
1293  +  Made it compliant with the FHS (filesystem hierarchy standard)
1294  +  Fixed IP address takeover so we can take over on non-eth0 interface
1295  +  Fixed IP takeover code so we can specify netmasks and broadcast addrs,
1296        or default them at the user's option.
1297  +  Added code to report on message buffer usage on SIGUSR[12]
1298  +  Made SIGUSR1 increment debug level, and SIGUSR2 decrement it.
1299  +  Incorporated Rudy's latest "Getting Started" document
1300  +  Made it largely Debian-compliant.  Thanks to Guenther Thomsen, Thomas
1301        Hepper, Iñaki Fernández Villanueva and others.
1302  +  Made changes to work better with Red Hat 6.1, and SMP code.
1303  +  Sometimes it seems that the Master Control Process dies :-(
1304
1305* Sat Aug 14 1999 Alan Robertson <alanr@unix.sh>
1306+ Version 0.4.2
1307  + Implemented simple resource groups
1308  + Implemented application notification for groups starting/stopping
1309  + Eliminated restriction on floating IPs only being associated with eth0
1310  + Added a uniform resource model, with IP resources being only one kind.
1311        (Thanks to Lars Marowsky-Bree for a good suggestion)
1312  + Largely rewrote the IP address takeover code, making it clearer, fit
1313        into the uniform resource model, and removing some restrictions.
1314  + Preliminary "Getting Started" document by Rudy Pawul
1315  + Improved the /proc/ha code
1316  + Fixed memory leak associated with serial ports, and problem with return
1317        of control to the "master" node.
1318        (Thanks to Holger Kiehl for reporting them, and testing fixes!)
1319
1320* Tue Jul 6 1999 Alan Robertson <alanr@unix.sh>
1321+ Version 0.4.1
1322  + Fixed major memory leak in 0.4.0 (oops!)
1323  + Added code to eliminate duplicate packets and log lost ones
1324  + Tightened up PPP/UDP startup/shutdown code
1325  + Made PPP/UDP peacefully coexist with "normal" udp
1326  + Made logs more uniform and neater
1327  + Fixed several other minor bugs
1328  + Added very preliminary kernel code for monitoring and controlling
1329        heartbeat via /proc/ha.  Very cool, but not really done yet.
1330
1331* Wed Jun 30 1999 Alan Robertson <alanr@unix.sh>
1332+ Version 0.4.0
1333  + Changed packet format from single line positional parameter style
1334        to a collection of {name,value} pairs.  A vital change for the future.
1335  + Fixed some bugs with regard to forwarding data around rings
1336  + We now modify /etc/ppp/ip-up.local, so PPP-udp works out of the box
1337        (at least for Red Hat)
1338  + Includes the first version of Volker Wiegand's Hardware Installation Guide
1339        (it's pretty good for a first version!)
1340
1341* Wed Jun 09 1999 Alan Robertson <alanr@unix.sh>
1342+ Version 0.3.2
1343  + Added UDP/PPP bidirectional serial ring heartbeat
1344        (PPP ensures data integrity on the serial links)
1345  + fixed a stupid bug which caused shutdown to give unpredictable
1346        results
1347  + added timestamps to /var/log/ha-log messages
1348  + fixed a couple of other minor oversights.
1349
1350* Mon May 10 1999 Alan Robertson <alanr@unix.sh>
1351+ Version 0.3.1
1352  + Make ChangeLog file from RPM specfile
1353  + Made ipresources only install in the DOC directory as a sample
1354
1355* Sun May 09 1999 Alan Robertson <alanr@unix.sh>
1356+ Version 0.3.0
1357  + Added UDP broadcast heartbeat (courtesy of Tom Vogt)
1358  + Significantly restructured code making it easier to add heartbeat media
1359  + added new directives to config file:
1360    + udp interface-name
1361    + udpport port-number
1362    + baud    serial-baud-rate
1363  + made manual daemon shutdown easier (only need to kill one)
1364  + moved the sample ha.cf file to the Doc directory
1365
1366* Sat Mar 27 1999 Alan Robertson <alanr@unix.sh>
1367+ Version 0.2.0
1368  + Make an RPM out of it
1369  + Integrated IP address takeover gotten from Horms
1370  + Added support to tickle a watchdog timer whenever our heart beats
1371  + Integrated enough basic code to allow a 2-node demo to occur
1372  + Integrated patches from Andrew Hildebrand <andrew@pdi.com> to allow it
1373    to run under IRIX.
1374  - Known Bugs
1375    - Only supports 2-node clusters
1376    - Only supports a single IP interface per node in the cluster
1377    - Doesn't yet include Tom Vogt's ethernet heartbeat code
1378    - No documentation
1379    - Not very useful yet :-)
1380
1381###########################################################
Note: See TracBrowser for help on using the repository browser.