source: projects/specs/trunk/h/heartbeat/heartbeat-vl.spec @ 3024

Revision 3024, 60.3 KB checked in by Takemikaduchi, 13 years ago (diff)

heartbeat: rollback

Line 
1%define           ENABLE_SNMP_SUBAGENT 0
2%define           ENABLE_MGMT 1
3%define           uid 24
4%define           gname haclient
5%define           uname hacluster
6# The macros above switch optional features and name the uid, group and user handled by the scriptlets.
7Summary:          Heartbeat subsystem for High-Availability Linux
8Summary(ja):      高可用性 Linux のための HeartBeat サブシステム
9Name:             heartbeat
10Version:          2.0.8
11Release:          5%{_dist_release}
12# Classification, licence and upstream home page.
13Group:            System Environment/Daemons
14License:          GPL/LGPL
15URL:              http://linux-ha.org/
16# Upstream source tarball and the two patches applied during prep.
17Source0:          http://linux-ha.org/download/%{name}-%{version}.tar.gz
18Patch0:           heartbeat-fedora-pam.patch
19Patch1:           heartbeat-fedora-chkconfig.patch
20# Build root and dependencies; the ENABLE_MGMT sections only apply when mgmt support is switched on.
21BuildRoot:        %{_tmppath}/%{name}-%{version}-root
22BuildRequires:    glib2-devel
23BuildRequires:    iputils
24BuildRequires:    libnet-devel
25BuildRequires:    libtool-ltdl-devel
26BuildRequires:    net-snmp-devel
27BuildRequires:    bzip2-devel
28BuildRequires:    ncurses-devel
29%if %{ENABLE_MGMT}
30BuildRequires:    gnutls-devel > 2
31BuildRequires:    pam-devel
32BuildRequires:    python-devel
33BuildRequires:    swig
34BuildRequires:    curl-devel
35%endif
36Requires:         stonith = %{version}-%{release}
37Requires:         pils = %{version}-%{release}
38Requires:         ldirectord = %{version}-%{release}
39Requires:         pygtk2 >= 2.4
40Requires(post):   /sbin/chkconfig
41Requires(preun):  /sbin/chkconfig
42%if %{ENABLE_MGMT}
43Requires:         gettext
44%endif
45
46%description
47heartbeat is a basic high-availability subsystem for Linux-HA.
48It will run scripts at initialization, and when machines go up or down.
49This version will also perform IP address takeover using gratuitous ARPs.
50It supports "n-node" clusters with significant capabilities for managing
51resources and dependencies.
52
53In addition it continues to support the older release 1 style of
542-node clustering.
55
56It implements the following kinds of heartbeats:
57        - Serial ports
58        - UDP/IP multicast (ethernet, etc)
59        - UDP/IP broadcast (ethernet, etc)
60        - UDP/IP heartbeats
61        - "ping" heartbeats (for routers, switches, etc.)
62           (to be used for breaking ties in 2-node systems)
63# ldirectord subpackage; tied to the heartbeat build of the same version and release.
64%package -n ldirectord
65Summary:          Monitor daemon for maintaining high availability resources
66Summary(ja):      高可用リソースを管理するための監視デーモン
67Group:            System Environment/Daemons
68Requires:         ipvsadm
69Requires:         %{name} = %{version}-%{release}
70Requires(post):   /sbin/chkconfig
71Requires(preun):  /sbin/chkconfig
72
73%description -n ldirectord
74ldirectord is a stand-alone daemon to monitor services of real servers
75for virtual services provided by The Linux Virtual Server
76(http://www.linuxvirtualserver.org/). It is simple to install
77and works with the heartbeat code (http://www.linux-ha.org/).
78# stonith subpackage; its only declared dependency is the pils build of the same version and release.
79%package -n stonith
80Summary:        Provides an interface to Shoot The Other Node In The Head
81Group:          System Environment/Daemons
82Requires:       pils = %{version}-%{release}
83
84%description -n stonith
85The STONITH module (a.k.a. STOMITH) provides an extensible interface
86for remotely powering down a node in the cluster.  The idea is quite simple:
87When the software running on one machine wants to make sure another
88machine in the cluster is not using a resource, pull the plug on the other
89machine. It's simple and reliable, albeit admittedly brutal.
90#'
91# pils subpackage (plugin and interface loading library); it declares no Requires of its own.
92%package -n pils
93Summary:        Provides a general plugin and interface loading library
94Group:          System Environment/Daemons
95
96%description -n pils
97PILS is a generalized and portable open source Plugin and Interface Loading
98System. PILS was developed as part of the Open Cluster Framework reference
99implementation, and is designed to be directly usable by a wide variety of
100other applications.
101PILS manages both plugins (loadable objects), and the interfaces these plugins
102implement. PILS is designed to support any number of plugins implementing any
103number of interfaces.
104# devel subpackage; requires the heartbeat base package of the same version and release.
105%package devel
106Summary:        Heartbeat development package
107Summary(ja):    Heartbeat 開発パッケージ
108Group:          Development/Libraries
109Requires:       heartbeat = %{version}-%{release}
110
111%description devel
112Heartbeat development package
113# Unpack the source quietly and apply both patches at strip level 1 (explicit -P form; the numbered shorthand is gone in rpm 4.20).
114%prep
115%setup -q
116%patch -P 0 -p1
117%patch -P 1 -p1
118# Configure and compile; the mgmt switch handed to configure follows ENABLE_MGMT.
119%build
120# disable-fatal-warnings flag used to disable gcc4.x warnings of 'difference in signedness'
121CFLAGS=${RPM_OPT_FLAGS} \
122%configure \
123  --disable-fatal-warnings \
124  --disable-static \
125%if %{ENABLE_MGMT}
126  --enable-mgmt
127%else
128  --disable-mgmt
129%endif
130make
131# Stage the build into a fresh build root, then tidy it up for packaging.
132%install
133rm -rf $RPM_BUILD_ROOT
134mkdir -p $RPM_BUILD_ROOT
135make DESTDIR=$RPM_BUILD_ROOT install
136(
137  cd $RPM_BUILD_ROOT/%{_sysconfdir}/ha.d/resource.d
138  ln -s %{_sbindir}/ldirectord ldirectord
139)
140# Directory that appears in the ldirectord file list.
141mkdir -p $RPM_BUILD_ROOT/%{_sysconfdir}/ha.d/conf
142
143# cleanup (the *.la pattern is quoted so the shell cannot expand it before find sees it)
144[ -d $RPM_BUILD_ROOT/usr/man ] && rm -rf $RPM_BUILD_ROOT/usr/man
145[ -d $RPM_BUILD_ROOT/usr/share/libtool ] && rm -rf $RPM_BUILD_ROOT/usr/share/libtool
146find $RPM_BUILD_ROOT -type f -name '*.la' -exec rm -f {} ';'
147# Add a Shell-script mode line and clear the executable bit; pymgmt.py is presumably only installed by mgmt builds, hence its guard.
148sed -i -e '1i# -*-Shell-script-*-' $RPM_BUILD_ROOT/%{_libdir}/heartbeat/ocf-shellfuncs
149sed -i -e '1i# -*-Shell-script-*-' $RPM_BUILD_ROOT/%{_sysconfdir}/ha.d/shellfuncs
150chmod -x $RPM_BUILD_ROOT/%{_libdir}/heartbeat/ocf-shellfuncs
151chmod -x $RPM_BUILD_ROOT/%{_sysconfdir}/ha.d/shellfuncs
152[ ! -f $RPM_BUILD_ROOT/%{_libdir}/heartbeat-gui/pymgmt.py ] || chmod -x $RPM_BUILD_ROOT/%{_libdir}/heartbeat-gui/pymgmt.py
153# Remove the build root, but never when the variable is empty or points at "/".
154%clean
155[ -z "${RPM_BUILD_ROOT}" ] ||
156  [ "${RPM_BUILD_ROOT}" = "/" ] ||
157  rm -rf $RPM_BUILD_ROOT
158# Create the haclient group and hacluster user; failures (for example, already existing) are ignored.
159%pre
160/usr/sbin/groupadd -g %{uid} %{gname} >/dev/null 2>&1 || :
161/usr/sbin/useradd -M -r -u %{uid} -s /sbin/nologin -d /var/lib/heartbeat/cores/hacluster \
162        -c 'heartbeat user' -g %{gname} %{uname} >/dev/null 2>&1 || :
163# Refresh the linker cache and register the heartbeat init script.
164%post
165/sbin/ldconfig
166/sbin/chkconfig --add heartbeat
167# $1 is 0 only on final removal; on upgrade the service registration must survive.
168%preun
169test "$1" != 0 || /sbin/chkconfig --del heartbeat
170# Refresh the linker cache; on final removal ($1 = 0) also drop the user and group.
171%postun
172/sbin/ldconfig
173test "$1" != 0 || /usr/sbin/userdel  %{uname} >/dev/null 2>&1 || :
174test "$1" != 0 || /usr/sbin/groupdel %{gname} >/dev/null 2>&1 || :
175# ldirectord: register the init script when the package is installed.
176%post -n ldirectord
177/sbin/chkconfig --add ldirectord
178# Unregister only on final removal ($1 = 0), not while upgrading.
179%preun -n ldirectord
180test "$1" != 0 || /sbin/chkconfig --del ldirectord
181# stonith runs ldconfig directly as its post/postun program; NOTE: keep the -p sections body-free (no comment lines after them).
182%post -n stonith -p /sbin/ldconfig
183
184%postun -n stonith -p /sbin/ldconfig
185
186%files
187%defattr(-,root,root)
188%doc %{_datadir}/doc/%{name}-%{version}
189%dir %{_sysconfdir}/ha.d
190%{_sysconfdir}/ha.d/harc
191%config(noreplace) %{_sysconfdir}/ha.d/shellfuncs
192%{_sysconfdir}/ha.d/rc.d
193%config(noreplace) %{_sysconfdir}/ha.d/README.config
194%{_libdir}/heartbeat
195%{_libdir}/libapphb.so.*
196%{_libdir}/libccmclient.so.*
197%{_libdir}/libcib.so.*
198%{_libdir}/libclm.so.*
199%{_libdir}/libcrmcommon.so.*
200%{_libdir}/libtransitioner.so.*
201%{_libdir}/libhbclient.so.*
202%{_libdir}/liblrm.so.*
203%{_libdir}/libpengine.so.*
204%{_libdir}/libplumb.so.*
205%{_libdir}/libplumbgpl.so.*
206%{_libdir}/librecoverymgr.so.*
207%{_libdir}/libstonithd.so.*
208%{_prefix}/lib/ocf
209%{_sysconfdir}/ha.d/resource.d/
210%exclude %{_sysconfdir}/ha.d/resource.d/ldirectord
211%{_sysconfdir}/init.d/heartbeat
212%config(noreplace) %{_sysconfdir}/logrotate.d/heartbeat
213%dir %{_var}/lib/heartbeat
214%dir %{_var}/lib/heartbeat/cores
215%dir %attr (0755, root, root) %{_var}/lib/heartbeat/cores/root
216%dir %attr (0755, nobody, nobody) %{_var}/lib/heartbeat/cores/nobody
217%dir %attr (0755, hacluster, haclient) %{_var}/lib/heartbeat/cores/hacluster
218%dir %{_var}/run/heartbeat
219%attr (0755, hacluster, haclient) %{_bindir}/cl_status
220%{_bindir}/cl_respawn
221%{_sbindir}/crmadmin
222%{_sbindir}/cibadmin
223%{_sbindir}/ccm_tool
224%{_sbindir}/crm_diff
225%{_sbindir}/crm_uuid
226%{_sbindir}/crm_mon
227%{_sbindir}/crm_sh
228%{_sbindir}/iso8601
229%{_sbindir}/crm_master
230%{_sbindir}/crm_standby
231%{_sbindir}/crm_attribute
232%{_sbindir}/crm_resource
233%{_sbindir}/crm_verify
234%{_sbindir}/attrd_updater
235%{_sbindir}/crm_failcount
236%{_sbindir}/ocf-tester
237%dir %attr (755, hacluster, haclient) %{_var}/run/heartbeat/ccm
238%dir %attr (755, hacluster, haclient) %{_var}/run/heartbeat/crm
239%dir %attr (755, hacluster, haclient) %{_var}/lib/heartbeat/crm
240%dir %attr (755, hacluster, haclient) %{_var}/lib/heartbeat/pengine
241%{_mandir}/man1/cl_status.1*
242%{_mandir}/man1/ha_logger.1*
243%{_mandir}/man1/hb_standby.1*
244%{_mandir}/man1/hb_takeover.1*
245%{_mandir}/man1/hb_addnode.1*
246%{_mandir}/man1/hb_delnode.1*
247%{_mandir}/man8/heartbeat.8*
248%{_mandir}/man8/apphbd.8*
249%{_mandir}/man8/ha_logd.8*
250%{_mandir}/man8/cibadmin.8*
251%{_mandir}/man8/crm_resource.8*
252%if %{ENABLE_SNMP_SUBAGENT}
253/LINUX-HA-MIB.mib
254%endif
255%if %{ENABLE_MGMT}
256%{_libdir}/heartbeat-gui
257%{_libdir}/libhbmgmt.so.*
258%{_libdir}/libhbmgmtclient.so.*
259%{_libdir}/libhbmgmtcommon.so.*
260%{_libdir}/libhbmgmttls.so.*
261%config(noreplace) %{_sysconfdir}/pam.d/hbmgmtd
262%{_datadir}/locale/zh_CN/LC_MESSAGES/haclient.mo
263%endif
264# ldirectord file list; defattr comes first so it also covers the doc entries.
265%files -n ldirectord
266%defattr(-,root,root)
267%doc doc/COPYING
268%doc doc/README
269%doc ldirectord/ldirectord.cf
270%{_sysconfdir}/ha.d/conf
271%{_sbindir}/ldirectord
272%{_sbindir}/supervise-ldirectord-config
273%config(noreplace) %{_sysconfdir}/logrotate.d/ldirectord
274%{_sysconfdir}/init.d/ldirectord
275%{_sysconfdir}/ha.d/resource.d/ldirectord
276%{_mandir}/man8/ldirectord.8*
277%{_mandir}/man8/supervise-ldirectord-config.8*
278# defattr first so it covers the docs. NOTE(review): the *.so.* glob also matches libraries listed under heartbeat and pils - confirm.
279%files -n stonith
280%defattr(-,root,root)
281%doc doc/COPYING
282%doc doc/README
283%{_libdir}/*.so.*
284%{_libdir}/stonith/
285%{_sbindir}/stonith
286%{_sbindir}/meatclient
287%{_mandir}/man8/stonith.8*
288%{_mandir}/man8/meatclient.8*
289# pils file list: defattr first; only versioned libpils objects here, the bare .so name is matched by the devel glob.
290%files -n pils
291%defattr(-,root,root)
292%doc doc/COPYING
293%doc doc/README
294%{_includedir}/pils
295%{_libdir}/libpils.so.*
296%{_libdir}/pils/
297# Development headers and unversioned .so files; defattr first so it covers the doc entry too.
298%files devel
299%defattr(-,root,root)
300%doc %{_datadir}/doc/%{name}-%{version}
301%{_includedir}/heartbeat/
302%{_includedir}/clplumbing/
303%{_includedir}/saf/
304%{_includedir}/ocf/
305%{_includedir}/stonith/
306%{_includedir}/pils/
307%{_libdir}/*.so
308
309%changelog
310* Sun Oct  3 2010 Ryoichi INAGAKI <ryo1@bc.wakwak.com> 2.0.8-5
311- rebuilt with new toolchain
312
313* Sun May 17 2009 Ryoichi INAGAKI <ryo1@bc.wakwak.com> 2.0.8-4
314- spec in UTF-8
315- changed devel Group to Development/Libraries
316
317* Tue May 05 2009 Satoshi IWAMOTO <satoshi.iwamoto@nifty.ne.jp> 2.0.8-3
318- new versioning policy
319- rebuild with gnutls 2.6.6, libtool 2.2.6 and curl 7.19.4
320- add BuildRequires: curl-devel
321
322* Sun Jan 06 2008 Shu KONNO <owa@bg.wakwak.com> 2.0.8-0vl2
323- rebuilt with net-snmp-5.4.1
324
325* Sat May 19 2007 Daisuke SUZUKI <daisuke@linux.or.jp> 2.0.8-0vl1
326- new upstream release
327- build with new environment
328
329* Mon Oct 30 2006 Daisuke SUZUKI <daisuke@linux.or.jp> 2.0.7-0vl2
330- rebuild with gnutls-1.4
331- add Japanese summaries
332
333* Mon Oct 23 2006 Daisuke SUZUKI <daisuke@linux.or.jp> 2.0.7-0vl1
334- initial build for Vine Linux based on FE package.
335
336* Wed Aug 30 2006 Joost Soeterbroek <fedora@soeterbroek.com> - 2.0.7-2
337- rebuild for Fedora Extras 6
338
339* Wed Aug 16 2006  Joost Soeterbroek <fedora@soeterbroek.com> - 2.0.7-1
340- upstream version 2.0.7
341
342* Sat Jul 15 2006  Joost Soeterbroek <fedora@soeterbroek.com> - 2.0.6-2
343- added BuildReqs: ncurses-devel
344
345* Fri Jul 14 2006  Joost Soeterbroek <fedora@soeterbroek.com> - 2.0.6-1
346- upstream version 2.0.6
347
348* Fri Jun 16 2006  Joost Soeterbroek <fedora@soeterbroek.com> - 2.0.5-2
349- bump for gnutls change in devel
350
351* Thu Apr 27 2006  Joost Soeterbroek <fedora@soeterbroek.com> - 2.0.5-1
352- upstream version 2.0.5
353- removed patch2 - ownership of /heartbeat/crm/cib.xml is no longer
354  set in cts/CM_LinuxHAv2.py.in
355
356* Wed Mar 29 2006  Joost Soeterbroek <fedora@soeterbroek.com> - 2.0.4-2
357- Version 2.0.4
358
359* Wed Mar  1 2006  Joost Soeterbroek <fedora@soeterbroek.com> - 2.0.3-9
360- changed user creation
361- added patch2 heartbeat-2.0.3-fedora-ccmuser.patch 
362
363* Wed Mar  1 2006  Joost Soeterbroek <fedora@soeterbroek.com> - 2.0.3-8
364- specifically excluded ldirectord symlink from heartbeat package
365- removed user and group deletion in postun
366- renamed subpackages ldirectord, pils and stonith to lose prefix heartbeat
367  by using -n
368
369* Tue Feb 28 2006  Joost Soeterbroek <fedora@soeterbroek.com> - 2.0.3-7
370- fixed more rpmlint errors and warnings
371
372* Sat Feb 25 2006  Joost Soeterbroek <fedora@soeterbroek.com> - 2.0.3-6
373- fixed number of rpmlint warnings and errors (still ignores some..)
374- generate 'predictable' uid and gid with fedora-usermgmt to use with
375  configure flag -with-ccmuser-id and groupadd, useradd
376- added Buildreq's: libtool-ltdl-devel, fedora-usermgmt-setup
377  net-snmp-devel, bzip2-devel
378- removed *.so duplication in heartbeat and heartbeat-devel
379- changed file sections
380
381* Fri Feb 24 2006  Joost Soeterbroek <fedora@soeterbroek.com> - 2.0.3-5
382- useradd with fedora-usermgmt
383- added *.so file to -devel sub-package
384
385* Sat Feb 18 2006  Joost Soeterbroek <fedora@soeterbroek.com> - 2.0.3-4
386- removed all perl requires; should be picked up by rpmbuild automagically
387- changed system user creation hacluster part to use baseid:
388  (http://fedoraproject.org/wiki/Packaging/UserCreation)
389
390* Thu Feb 16 2006  Joost Soeterbroek <fedora@soeterbroek.com> - 2.0.3-3
391- removed Requires: python and gnutls
392- changed _libdir/ocf -> _prefix/lib/ocf
393- reversed subpackages depend on basepackage
394- removed Req swig (kept BuildReq)
395- added Req pygtk2
396
397* Wed Feb 15 2006  Joost Soeterbroek <fedora@soeterbroek.com> - 2.0.3-2
398- fixes for various rpmlint errors and warnings
399- fixed setup -q
400- make subpackages depend on basepackage, not reverse
401- clean buildroot at beginning of install
402- replaced a number of hardcoded paths with RPM macros
403- Changed Group from Networking/Daemons to System Environment/Daemons
404- enable mgmt option
405
406* Sun Feb 12 2006  Joost Soeterbroek <fedora@soeterbroek.com> - 2.0.3-1
407- rebuilt for Fedora Extras
408
409* Fri Feb 10 2006  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
410+ Version 2.0.3 - Bug fixes and significant new features.
411  + Management Daemon/Library and GUI client
412    + provide a management library for management daemon and CIM provider
413    + provide a management daemon and a basic GUI management tool
414  + CIM enablement
415    + CIM (Common Information Model) enablement - works with
416      sblim-sfcb, OpenWBEM, and Pegasus CIMOMs
417    - not yet compiled into our binary RPMs because of dependencies
418  + CRM (Cluster Resource Manager) General
419    + All shutdowns go via the PE/TE - preserves inter-resource ordering
420    + Support for future changes to the CIB (deprecation of cib_fragment)
421    + Overhaul of IPC and HA channel callback logic
422    + Many improvements to the quality and quantity (reduced) of logging
423  + CRMd
424    + Timerless elections - when everyone has voted we're done
425    + Use the replace notification from the CIB to re-update our copy with
426      our view of our peers.
427    + Reliably detect if the LRM connection is still active.
428    + Elections
429      + newer versions defer to older ones in DC elections
430        (opposite of current behavior)
431      + this means that only once the complete cluster has been upgraded will
432        we start acting like the new version and accept new config options
433      + it also means newer PE's and TE's (the most complex pieces) don't need
434        "act like the old version" options and can rely on all slaves being at
435        least as up-to-date as they are
436      + people can run mixed clusters as long as they want
437        (until they want the new PE features)
438      + new DCs only update the version number in the CIB if they have a
439        higher value
440      + nodes that start and have a lower version than that stored in the CIB
441        shut themselves down (the CRM part anyway)
442      + this prevents an admin from introducing old nodes back into an upgraded
443        cluster. It probably doesn't fully understand the config and may not
444        support the actions the PE/TE requires.
445  + CIB (Common Information Base daemon)
446    + Make sure "query only" connections can't modify the CIB
447    + Periodically dump some stats about what the CIB has been doing.
448    + Verify there are no memory leaks
449    + Performance enhancements
450    + Prevent a single CIB client from blocking everyone else
451    + Clients Can be notified of full CIB replacements
452    + record_config_changes option in ha.cf for those worried about
453      the amount of logging.  Defaults to "on".
454    + suppress_cib_writes CIB option replaced with enable_config_writes in ha.cf
455      (enable_config_writes to be removed in 2.0.4)
456    + Never write the status section to disk
457    + Check permissions for the on-disk CIB at startup
458    + Don't trash unreadable on-disk CIBs
459    + Fix for updates made against the whole CIB (not just one section)
460  + PEngine (Policy Engine)
461    + Many improvements to the handling of resource groups
462    + Support "anonymous" clones
463    + Fix stonith ordering
464    + Order DC shutdowns after everyone else's
465    + Support short resource names (for group and clone resources)
466    + The ordering and colocation of grouped resources is now optional
467    + Support probing new nodes for active resources.
468    + All "probe" actions are controlled by the PE.
469      + No resource may be started until the probing is complete.
470      + Do not probe for resources we know to be active on unprobed nodes
471    + When looking for monitor ops, only mark it optional if it was already
472      active on the node we're interested in.
473    + Detect changes to class/type/provider/parameters and force a restart
474      of the resource
475    + New record_pengine_inputs option in ha.cf for those worried about
476      the amount of logging.  Defaults to "on".
477    + Differentiate between config and processing errors
478      + reduces the frequency that we need to log the complete CIB
479    + Make notify for master/slave work
480    + New CIB option: stop_orphan_resources (boolean)
481      If a resource is no longer defined, we can optionally stop it
482    + New CIB option: stop_orphan_actions (boolean)
483      If a monitor op for a given interval is no longer defined, we can
484      optionally stop it
485    + Add support for time and phase-of-the-moon based constraints
486    + Improved failure handling: avoiding false positives
487    + Always create orphaned resources - so they show up in crm_mon
488    + Do not require sequential clone numbers starting at 0
489  + TEngine (transition engine)
490    + Detect old stonith ops
491  + CLIs (Command Line interfaces)
492    + Create a --one-shot option for crm_mon
493    + Switch a number of CLI tools to use the new synchronous connections
494    + Log errors to stderr where they will be seen and therefore useful
495    + Support migration and un-migration of resources and resource groups
496    + Create crm_verify for checking configuration validity
497    + Simplify the passing of XML to cibadmin
498  + Known open bugs worth mentioning:
499    + 1075, 1080, 1081, 1084, 1085, 1064, 1069, 756, 984
500    + 1050, 1082, 1037, 1079
501   
502* Thu Sep 22 2005  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
503+ Version 2.0.2 - small bug fix only release
504  + Fixed a bug in ping directive - it works again
505  + Added a check to BasicSanityCheck to check ping and ping_group directives
506  + fixed cl_status nodestatus to return 0 if a node has status "ping"
507  + fixed a memory leak in the CRM's LRM interface code
508  + fixed code which determines which version of the CRM becomes
509    the DC when basic CIB schema versions differ.  It now prefers
510    the older version to be DC instead of the newer version.
511
512* Wed Sep 14 2005  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
513+ Version 2.0.1 -
514  + Communication Layer
515    + netstring encoding format is changed to be more efficient
516    + add compression capability for big messages
517  + Add man pages for hb_standby/hb_takeover   
518  + The assert triggered by 2.0.0 has been fixed
519  + CIB can now contain XML comments and/or be in DOS format   
520  + Includes implementation of the ISO8601 date format
521  + New CLI tools for changing cluster preferences, node attributes
522    and node standby
523  + Improved recovery and placement of group resources
524  + Detection of failed nodes by the Policy Engine is fixed
525  + New Policy Engine features
526    http://www.linux-ha.org/ClusterResourceManager/DTD1.0/Annotated :
527      sections 1.5.[8,9,10,12]
528    + Constraints and instance attributes can now be active conditionally
529    + Rules can now contain other rules
530    + Date/Time based expressions are supported
531    + Cloned resources can now optionally be notified before and after
532      any of its peers are stopped or started.
533    + The cluster can re-evaluate the configuration automatically after
534      a defined interval of idleness
535  + Removed a flow control message which was very annoying when operating
536    in a mixed 1.x/2.x environment
537  -- Known Bugs :-( --
538    - Bug 859 - FSA took too long to complete action - fully recovered from
539    - Bug 882 - IPC channel not connected during shutdown - harmless
540    - Bug 879 - Failed actions cause extra election - harmless
541 Each of these occurs about once or twice in 5000 test iterations
542       - This is probably > 10K failovers
543    - rsc_location constraints cannot have rules that contain other rules
544      (fixed in CVS after release)
545* Fri Jul 29 2005  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
546+ Version 2.0.0 - First stable release of the next generation of the Linux-HA project
547  + Basic Characteristics described here:
548        http://linux-ha.org/FactSheetv2
549  + Core infrastructure improvements:
550    + Messaging (message acknowledging and flow control)
551    + Logging   (logging daemon)
552  + Release 1.x style (2-node) clusters fully supported
553  + Multi-node support (so far up to 16-node clusters tested)
554        See http://linux-ha.org/GettingStartedV2 for more information
555  + New components:
556    + Cluster Information Base    (replicated resource configuration)
557    + Cluster Resource Manager    (supporting 1->N nodes)
558    + Modular Policy Engine       (controlling resource placement)
559    + Local Resource Manager      (policy free, not cluster aware)
560    + Stonith Daemon              (stand-alone fencing  subsystem)
561  + Support for OCF and LSB resource agents
562  + Support for composite resource types (groups, clones)
563  + Support for a rich set of resource location and ordering constraints
564  + Conversion tool for existing haresources
565  + Resources monitored by request
566  + Resource "maintenance" mode
567  + Several failback, failure and "No Quorum" behaviours to choose from
568        (global defaults and per action or resource)
569  + Sample cluster state and configuration monitoring tools
570
571  Known issues in 2.0.0:
572    - Under some rare circumstances the cluster manager will time out
573      while stabilizing a new cluster state.  This appears to be
574        otherwise harmless - the cluster is actually fine.
575        http://www.osdl.org/developer_bugzilla/show_bug.cgi?id=770
576    - Under some rare circumstances, a dev assert will be triggered
577        in unpack.c.  This results in the pengine getting restarted.
578        This is annoying, but not a disaster.
579        http://www.osdl.org/developer_bugzilla/show_bug.cgi?id=797
580
581* Mon May 23 2005  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
582+ Version 1.99.5 - Near-final beta of 2.0.0 release
583  + many bug fixes - code looks very stable at this point
584    -- well tested at this point on 4 and 8 node clusters.
585
586* Thu Apr 07 2005  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
587+ Version 1.99.4 - Near-final beta of 2.0.0 release
588  + many bug fixes since 1.99.1
589  + new external STONITH model - fully supports scripting interface
590  + tested through 12 node clusters successfully
591  + No serious defects found in testing
592  + Easier-to-understand locational constraints model
593  + Many bug fixes of many kinds
594  + Important bug fixes to OCF IPaddr resource agent
595  + Resources are monitored only on request
596  + See http://wiki.linux-ha.org/ClusterResourceManager/Setup
597    for basic ideas about getting started.
598  + Release 1 style (2-node) clusters still fully supported
599  + Release 2 style clusters support 1-N node clusters
600        (where N is probably something like 8-32)
601
602* Sun Mar 20 2005  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
603+ Version 1.99.3 - Near-final beta "technology preview" of 2.0.0 release
604  + many bug fixes since 1.99.1
605  + tested through 12 node clusters with reasonable success
606  + new STONITH API
607
608* Sun Feb 20 2005  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
609+ Version 1.99.2 - Near-final beta "technology preview" of 2.0.0 release
610  + Many many many changes.  Far too many to describe here.
611  + See http://wiki.linux-ha.org/ClusterResourceManager/Setup
612    for certain basic ideas about getting started.
613
614* Mon Oct 11 2004  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
615+ Version 1.99.1 - *early* beta series - preparing for 2.0.0
616  + Andrew provided a number of fixes to the CRM and 2.0 features
617  + Fixed a problem with retrying failed STONITH operations
618
619* Mon Oct 11 2004  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
620+ Version 1.99.0 - *early* beta series - preparing for 2.0.0
621  + All STABLE changes noted below have been ported to this branch
622  + Included in this release is a beta of the next generation of Heartbeat
623        resource manager developed by Andrew Beekhof. 
624        http://linuxha.trick.ca/NewHeartbeatDesign is a good place to learn
625        more about this effort. Please examine crm/README, crm/test/README
626        and crm/crm-1.0.dtd for example usage and configuration.
627  + Also included is the L(ocal) R(esource) M(anager) developed by IBM China
628        which is an integral part of the NewHeartbeatDesign.
629  + Known caveats:
630    - STONITH as a whole has seen a code cleanup and should be tested
631      carefully.
632    - The external STONITH plug-in has undergone major surgery and
633      probably doesn't work yet.
634    - the new CRM is not perfectly stable with 3 nodes yet.
635  + PLEASE see http://osdl.org/developer_bugzilla/enter_bug.cgi?product=Linux-HA
636    and use it to report quirks and issues you find!
637 
638* Sat Sep 18 2004  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
639+ Version 1.2.3 (stable)
640  + fixed a serious error which causes heartbeat to misbehave after about
641        10 months of continuous operation
642  + Made our ARP packets more RFC compliant
643  + Extended apcmastersnmp code to deal with new devices
644  + fixed a bug concerning simultaneous stops of both machines causing one
645        of them to not shut down.
646  + added an option to suppress reporting on packet corruption
647  + fixed it so that we don't create the FIFO by the RPM
648  + made cl_status setgid so anyone can run it, and fixed exit codes
649  + eliminated a serious memory leak associated with client code
650  + packaged doc files which had been missed before
651  + fixed many many small bugs and memory leaks detected by BEAM
652  + added several new test cases
653  + fixed longstanding bug in plugin unloading
654  + fixed a shutdown hang problem
655  + several fixes for Solaris, FreeBSD
656  + Solaris packaging now included in base
657  + fixed a bug related to the apache resource agent not handling
658        quoted parameters
659  + added use_apphbd parameter to have heartbeat register
660        with apphbd instead of watchdog device when desired
661  + changed apphbd to default its config file to /etc
662  + added snmp subagent code
663  + added hbaping communications plugin
664  + added external STONITH plugin
665  + ldirectord: fixed a bug where real servers that are
666        present in multiple virtual services will only be added
667        to one virtual service.
668
669* Tue May 11 2004  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
670+ Version 1.2.2 (stable)
671  + Fixed several format string errors in communication plugins
672  + Fixed a bug which kept us from diagnosing errors in non-aliased interfaces
673  + Fixed a bug in ipaddr which caused an infinite loop when auto_failback on
674  + Updated Debian things...
675  + Added IPv6addr resource agent
676  + Added ibmhmc STONITH plugin
677  + Added cl_status command
678  + Fixed a bug regarding restarts when auto_failback is on...
679  + Fixed a couple of bugs in sha1 authentication method for very long keys
680  + Fixed a bug in the portblock resource agent so that it no longer blocks
681          ports on the loopback interface
682  + Increased the time allowed for split brain test before it declares failure
683
684+ Version 1.2.1 (stable)
685  + Netstrings can now be used for our on-the-wire data format
686  + Perl/SWIG bindings added for some heartbeat libraries
687  + Significant improvements to SAF data checkpointing API
688  + Implemented unbuffered ipcsocket code for SAF APIs
689  + Many Solaris fixes -- except for ipfail, Solaris works
690  + Significant library restructuring
691  + Watchdog device NOWAYOUT is now overridden if defaulted
692  + Watchdog device now kills machine instantly after deadtime
693        instead of after one minute
694  + Hostnames should now be treated case-independently...
695  + Added new client status APIs - client_status() and cstatus_callback()
696  + Fixed bug with auto_failback and quick full restarts
697  + We now automatically reboot when resources fail to stop correctly...
698  + We now check the status of the configured STONITH device hourly...
699  + STONITH operations repeat after a 5 second delay, not immediately...
700  + Added hb_takeover command - complement to hb_standby
701  + Added documentation on how to use evlog/TCP to enable testing to
702        take place without losing messages due to UDP message forwarding
703  + Several new tests from Mi, Jun - split brain, bandwidth, failure
704        detection time.
705  + Fix to LVM resource from Harald Milz <hm@muc.de>
706  + Fixed FreeBSD authentication problems breaking ipfail
707  + Fixed .so loading on Debian
708  + Fixed false complaints about resource scripts (from Jens Schmalzing)
709  + Fixed false stop failure from LinuxSCSI  (from Jens Schmalzing <j.s@lmu.de>)
710
711
712
713* Thu Apr 15 2004  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
714+ Version 1.3.0 - beta series
715  + Netstrings can now be used for our on-the-wire data format
716  + Perl/SWIG bindings added for some heartbeat libraries
717  + Significant improvements to SAF data checkpointing API
718  + Implemented unbuffered ipcsocket code for SAF APIs
719  + Many Solaris fixes -- except for ipfail, Solaris works
720  + Significant library restructuring
721  + Watchdog device NOWAYOUT is now overridden if defaulted
722  + Watchdog device now kills machine instantly after deadtime
723        instead of after one minute
724  + Hostnames should now be treated case-independently...
725  + Added new client status APIs - client_status() and cstatus_callback()
726  + Fixed bug with auto_failback and quick full restarts
727  + We now automatically reboot when resources fail to stop correctly...
728  + We now check the status of the configured STONITH device hourly...
729  + STONITH operations repeat after a 5 second delay, not immediately...
730  + Added hb_takeover command - complement to hb_standby
731  + Added documentation on how to use evlog/TCP to enable testing to
732        take place without losing messages due to UDP message forwarding
733  + Several new tests from Mi, Jun - split brain, bandwidth, failure
734        detection time.
735  + Fix to LVM resource from Harald Milz <hm@muc.de>
736
737* Tue Feb 16 2004  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
738+ Version 1.2.0
739  + Replaced the nice_failback option with the auto_failback option.
740        THIS OBSOLETES THE NICE_FAILBACK OPTION. READ THE DOCS FOR HOW
741        TO UPGRADE SMOOTHLY.
742  + Added a new feature to hb_standby which allows you to give up
743          any specific category of resources:  local, foreign, or all.
744        The old behavior is "all" which is the default.
745        This allows you to put an auto_failback no cluster into
746          an active/active configuration on demand.
747  + ipfail now works properly with auto_failback on (active/active)
748  + ipfail now has "hysteresis" so that it doesn't respond immediately
749        to a network failure, but waits a little while so that the
750        damage can be properly assessed and extraneous takeovers avoided
751  + Added new ping node timeout directive "deadping"
752  + Made sure heartbeat preallocated stack and heap, and printed a
753        message if we allocate heap once we're started up...
754  + IPMILan STONITH plugin added to CVS
755  + Added IPaddr2 resource script
756  + Made the APC smart UPS ups code compatible with more UPSes
757  + Added a (preliminary?) ordered messaging facility from Yi Zhu
758  + Changed IPaddr's method of doing ARPs in background so that
759        certain timing windows were closed.
760  + Added OCF (wrapper) resource script
761  + Allow respawn programs to take arguments
762  + Added pinggroups (where any node being up is OK)
763  + SIGNIFICANT amount of internal rearchitecture.
764  + Many bug fixes.
765  + Several documentation updates.
766
767* Tue Feb 10 2004  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
768+ Version 1.1.5
769  + ipfail now has "hysteresis" so that it doesn't respond immediately
770        to a network failure, but waits a little while so that the
771        damage can be properly assessed and extraneous takeovers avoided
772  + Several fixes to cl_poll()
773  + More fixes to the IPC code - especially handling data reception
774        after EOF
775  + removed some unclean code from GSource for treating EOF conditions
776  + Several bugs concerning hanging when shutting down early during startup
777  + A few BasicSanityCheck bug fixes
778  + CTS now allows a single machine to be able to monitor several clusters
779  + Most former CTS options are now either unneeded or on the command line
780  + Increased number of ARPs and how long they're being sent out
781  + Fixed uncommon (authorization) memory leak
782  + Some Solaris portability fixes.
783  + Made init script handle standby correctly for new config files
784  + Improved the fast failure detection test
785  + Added some backwards compatibility for nice_failback and some default
786        authentication directives
787  + Corrected the 1.1.4 change log
788 
789
790* Fri Jan 22 2004  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
791+ Version 1.1.4
792  + ipfail now works properly with auto_failback on (active/active)
793  + Changed the API to use sockets (IPC library) instead of FIFOs.
794  + Added new apiauth directives to provide authorization information
795        formerly provided by the FIFO permissions.
796  + Added Intel's implementation of the SAF data checkpointing API and daemon
797  + Added a cleanup suggested by Emily Ratliff.
798  + IPMILan STONITH plugin added to CVS
799  + Added IPaddr2 resource script
800  + Various cleanups due to horms.
801  + Fixed authentication to work on 64-bit platforms(!)
802  + Fixed the cl_poll() code to handle corner cases better
803  + Made heartbeat close watchdog device before re-execing itself
804  + New CTS improvements from Mi, Jun <jun.mi@intel.com>
805  + Various minor bug fixes.
806      . Several shutdown bugs addressed
807      . fixed sendarp to make a pid file, so we can shut it down
808          when we shut everything else down in case it's still running.
809      . Lots of minor bug fixes to IPC code
810      . Lots of minor bug fixes to ipctest program
811      . made BasicSanityCheck more tolerant of delays
812      . Fixed IPC code to authenticate based on ints, not int*s.
813      . Check properly for strnlen instead of strlen...
814      . Several signed/unsigned fixes
815      . A few uninitialized vars now are inited
816      . Switched to compiling lex/yacc sources the automake way
817      . Lots of minor CTS fixes...
818
819  + ldirectord bug fixes:
820    . When new real servers are added on initialisation or when
821        the configuration file is reread they are marked with status
822        of -1 (uninitialised) so they will be checked and inserted
823        into the virtual service as required
824    . All checks use the checkport if set, otherwise the port set for
825        the individual real server. This was the case for http and
826        connect checks, but others had variations on this theme.
827    . When the configuration file is reread because it changed
828        on disk and autoreload is set, check the real servers
829        immediately rather than waiting for checkinterval to expire
830    . Already running message sent to stderr instead of stdout
831    . Support alternate server in real-server specific URL
832    . Treat the same real server with different weights as a different
833        real server. Fixes bug reported by Philip Hayward whereby the same
834        real-server would always have the same weight, regardless of
835        the ldirectord.cf
836
837* Fri Sep 26 2003  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
838+ Version 1.1.3
839  + Bugfix for heartbeat starting resources twice concurrently if
840    auto_failback was set to "legacy".
841  + Bugfix for messages getting lost if messages were sent in quick
842    succession. (Kurosawa Takahiro)
843  + Bugfix for Filesystem resource checking for presence of filesystem
844    support before loading the module.
845  + BasicSanityCheck extended to cover more basic tests.
846  + Bugfix for findif not working correctly for CIDR netmasks.
847  + Minor bugfix for ldirectord recognizing new schedulers correctly and
848    timeout settings are now being honoured.
849  + Enhanced the message giving a better explanation of how to set up node
850    names properly when current node not found in the ha.cf file
851  + Send a message to the cluster whenever we have a node which doesn't
852    need STONITHing - even though it's gone down.  This fix needed
853    by CCM, which is in turn needed by EVMS.
854  + Enhanced the messages for missing ha.cf and missing haresources files
855    explaining that sample config files are found in the documentation.
856  + Fix for memory leak from Forrest Zhao<forrest.zhao@intel.com>
857  + Added a (preliminary?) ordered messaging facility from Yi Zhu
858  + FAQ updates
859  + Added Xinetd resource script
860  + Added OCF (wrapper) resource script
861  + Allow respawn programs to take arguments
862  + Added pinggroups (where any node being up is OK)
863  + fixed ldirectord negotiatetimeout for HTTP
864  + fixed a bug which caused -d flag to be ignored
865  + failing resource scripts are now ERRORs not WARNings
866  + now shuts down correctly when auto_failback == legacy
867
868
869* Mon Jul 13 2003  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
870+ Version 1.1.2
871  + Replaced the nice_failback option with the auto_failback option.
872        THIS OBSOLETES THE NICE_FAILBACK OPTION. READ THE DOCS FOR HOW
873        TO UPGRADE SMOOTHLY.
874  + Changed IPaddr to not do ARPs in background, and shortened time
875        between ARPs.  Also made these things tunable...
876  + changed our comm ttys to not become our controlling TTYs
877  + Enhanced the ServeRAID script to fix a critical bug by using a new feature
878  + Added a new DirectoryMap to CVS - tells where everything is...
879  + significantly enhanced the BasicSanityCheck script, and the tests
880        it calls.
881  + added a new option to use a replacement poll function for improved
882        real-time performance.
883  + added the ability to have a cluster node's name be different
884        from its uname -n
885  + Moved where CTS gets installed to /usr/lib/heartbeat/cts
886  + Big improvements to the CTS README from IBM test labs in Austin.
887  + bug fixes to the WTI NPS power switch
888  + new client API calls:
889        return arbitrary configuration parameters
890        return current resource status
891  + Added a new clplumbing function: mssleep()
892  + added new capabilities for supporting pseudo-resources
893  + added new messages which come out after initial takeover is done
894         (improves CTS results)
895  + LOTS of documentation updates.
896  + fixed a security vulnerability
897  + fixed a bug where heartbeat would shut down while in the middle
898        of processing resource movement requests.
899  + changed compilation flags to eliminate similar future security
900        issues
901  + went to even-more-strict gcc flags
902  + fixed several "reload" bugs.  Now reload works ;-)
903  + fixed STONITH bug when other node never heard from.
904  + Minor bug fixes (cleaned up corrupted message)
905  + Two different client API bugs fixed.
906  + changed the configure script to test which warning flags are
907        supported by the current gcc.
908  + enhanced the API test program to test new capabilities...
909
910
911* Wed May 21 2003  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
912+ Version 1.1.1
913  + Significant restructuring of the processes in heartbeat
914  + Added a new feature to hb_standby which allows you to give up
915          any specific category of resources:  local, foreign, or all.
916        The old behavior is "all" which is the default.
917        This allows you to put a nice_failback cluster into
918          an active/active configuration
919  + Enhancements to the ServeRAID code to make it work with the new
920    (supported) version of IPSSEND from the ServeRAID folks...
921  + Added STONITH code for the Dell remote access controller
922  + Fixed a major bug which kept it from taking over correctly after 246
923        days or so
924  + Fixed a major bug where heartbeat didn't lock itself into memory
925        properly
926  + Added new ping node timeout directive "deadping"
927  + Made sure heartbeat preallocated stack and heap, and printed a
928        message if we allocate heap once we're started up...
929  + Minor heartbeat API bug fixes
930  + Minor documentation fixes
931  + Minor fix to allow IP addresses with /32 masks...
932  + Fixed a timing window for !nice_failback resource acquisition
933  + Added several CCM bug fixes
934  + Made the APC smart UPS ups code compatible with more UPSes
935  + Fixed a bug in respawn
936  + Enhanced internal checking for malloc errors...
937  + Added IP alias search optimization from Sean Reifschneider
938
939* Wed Mar 19 2003  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
940+ Version 1.0.2:
941  + Fixed comment errors in heartbeat init script to allow it to run on RH 8.0
942  + Changed apphbd to use poll(2) instead of sigtimedwait(2)
943  + Put missing files into tarball
944  + Documentation improvements for IPaddr and other things
945  + Fixed an error in hb_standby which kept it from working if releasing
946    resources takes more than 10 seconds
947  + Added a fix to allow heartbeat to run on systems without writable disk
948    (like routers booting from CD-ROM)
949  + Added configuration file for apphbd
950  + Added fix from Adam Li to keep recoverymgr from looping at high priority
951  + Added fix to ServeRAID resource to make it work with (new) supported
952    hardware
953  + Added Delay resource script
954  + Added fix to Filesystem to allow it to support NFS mounts and allow
955    user to specify mount options
956  + Added fix to IPaddr to make tmp directory for restoring loopback device
957  + Added fix to ipcsocket code to deal correctly with EAGAIN when sending
958    message body
959
960* Mon Feb 17 2003  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
961+ Version 1.0.1:
962  + Fixed some compile errors on different platforms, and library versions
963  + Disable ccm from running on 'ping' nodes
964  + Put in Steve Snodgrass' fix to send_arp to make it work on non-primary
965        interfaces.
966
967* Thu Feb 13 2003  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
968+ Version 1.0.1 beta series
969
970  0.4.9g:
971  + Changed default deadtime, warntime, and heartbeat interval
972  + Auto* tool updates
973  + VIP loopback fixes for IP address takeover
974  + Various Solaris and FreeBSD fixes
975  + added SNMP agent
976  + Several CCM bug fixes
977  + two new heartbeat API calls
978  + various documentation fixes, including documentation for ipfail
979  + Numerous minor cleanups.
980  + Fixed a few bugs in the IPC code.
981  + Fixed the (IPC) bug which caused apphbd to hang the whole machine.
982  + Added a new IPC call (waitout)
983  + Wrote a simple IPC test program.
984  + Clarified several log messages.
985  + Cleaned up the ucast communications plugin
986  + Cleaned up for new C compilers
987  + Fixed permissions bug in IPC which caused apphbd to not be usable by all
988  + Added a new rtprio option to the heartbeat config file
989  + updated apphbtest program
990  + Changed ipfail to log things at same level heartbeat does
991
992
993* Sat Nov 30 2002  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
994+ Version 0.5 beta series (now renamed to 1.0.1 beta series).
995  0.4.9f:
996  + Added pre-start, post-start, pre-stop and post-stop constructs in init script
997  + various IPC fixes
998  + Fix to STONITH behavior: STONITH unresponsive node right after we reboot
999  + Fixed extreme latency in IPC code
1000  + various configure.in cleanups
1001  + Fixed memory leak in IPC socket code
1002  + Added streamlined mainloop/IPC integration code
1003  + Moved more heartbeat internal communication to IPC library
1004  + Added further support for ipfail
1005  + Added supplementary groups to the respawn-ed clients
1006  + Added standby to init script actions
1007  + Lots of minor CCM fixes
1008  + Split (most) resource management code into a separate file.
1009  + Fixes to accommodate different versions of libraries
1010  + Heartbeat API client headers fixup
1011  + Added new API calls
1012  + Simplified (and fixed) handling of local status.  This would sometimes cause
1013        obscure failures on startup.
1014  + Added new IPsrcaddr resource script
1015
1016  KNOWN BUGS:
1017  + apphbd goes into an infinite loop on some platforms
1018
1019* Wed Oct 9 2002  Alan Robertson <alanr@unix.sh> (see doc/AUTHORS file)
1020  0.4.9e:
1021  + Changed client code to keep write file descriptor open at all times
1022        (realtime improvement)
1023  + Added a "poll replacement"  function based on sigtimedwait(2), which
1024        should be faster for those cases that can use it.
1025  + Added a hb_warntime() call to the application heartbeat API.
1026  + Changed all times in the configuration file to be in milliseconds
1027        if specified with "ms" at the end.  (seconds is still the default).
1028  + Fixes to serious security issue due to Nathan Wallwork <nwallwo@pnm.com>
1029  + Changed read/write child processes to run as nobody.
1030  + Fixed a bug where ping packets are printed incorrectly when debugging.
1031  + Changed heartbeat code to preallocate some heap space.
1032  + CCM daemon API restructuring
1033  + Added ipc_channel_pair() function to the IPC library.
1034  + Changed everything to use longclock_t instead of clock_t
1035  + Fixed a bug concerning the ifwalk() call on ping nodes in the API
1036  + Made apphbd run at high priority and locked into memory
1037  + Made a library for setting priority up.
1038  + Made ucast comm module at least be configurable and loadable.
1039  + Fixed a startup/shutdown timing problem.
1040
1041  0.4.9d:
1042  + removed an "open" call for /proc/loadavg (improve realtime behavior)
1043  + changed API code to not do 1-char reads from clients
1044  + Ignored certain error conditions from API clients
1045  + fixed an obscure error message about trying to retransmit a packet
1046        which we haven't sent yet.  This happens after restarts.
1047  + made the PILS libraries available in a separate package
1048  + moved the stonith headers to stonith/... when installed
1049  + improved debugging for NV failure cases...
1050  + updated AUTHORS file and simplified the changelog authorship
1051        (look in AUTHORS for the real story)
1052  + Added Ram Pai's CCM membership code
1053  + Added the application heartbeat code
1054  + Added Kevin Dwyer's ipfail client code to the distribution
1055  + Many fixes for various tool versions and OS combinations.
1056  + Fixed a few bugs related to clients disconnecting.
1057  + Fixed some bugs in the CTS test code.
1058  + Added BasicSanityCheck script to tell if built objects look good.
1059  + Added PATH-like capabilities to PILS
1060  + Changed STONITH to use the new plugin system.
1061  + *Significantly* improved STONITH usage message (from Lorn Kay)
1062  + Fixed some bugs related to restarting.
1063  + Made exit codes more LSB-compliant.
1064  + Fixed various things so that ping nodes don't break takeovers.
1065
1066  0.4.9c and before:
1067  + Cluster partitioning  now handled correctly (really!)
1068  + Complete rearchitecture of plugin system
1069  + Complete restructure of build system to use automake and port things
1070        to AIX, FreeBSD and solaris.
1071  + Added Lclaudio's "standby" capability to put a node into standby
1072        mode on demand.
1073  + Added code to send out gratuitous ARP requests as well as gratuitous
1074        arp replies during IP address takeover.
1075  + Suppress stonith operations for nodes which went down gracefully.
1076  + Significantly improved real-time performance
1077  + Added new unicast heartbeat type.
1078  + Added code to make serial ports flush stale data on new connections.
1079  + The Famous CLK_TCK compile time fixes (really!)
1080  + Added a document which describes the heartbeat API
1081  + Changed the code which makes FIFOs to not try and make the FIFOs for
1082        named clients, and several other minor API client changes.
1083  + Fixed a fairly rare client API bug where it would shut down the
1084        client for no apparent reason.
1085  + Added stonith plugins for: apcmaster, apcmastersnmp switches, and ssh
1086        module (for test environments only)
1087  + Integrated support for the Baytech RPC-3 switch into baytech module
1088  + Fixes to APC UPS plugin
1089  + Got rid of "control_process: NULL message" message
1090  + Got rid of the "controlfifo2msg: cannot create message" message
1091  + Added -h option to give usage message for stonith command...
1092  + Wait for successful STONITH completion, and retry if it's configured.
1093  + Sped up takeover code.
1094  + Several potential timing problems eliminated.
1095  + Cleaned up the shutdown (exit) code considerably.
1096  + Detect the death of our core child processes.
1097  + Changed where usage messages go depending on exit status from usage().
1098  + Made some more functions static.
1099  + Real-time performance improvement changes
1100  + Updated the faqntips document
1101  + Added a feature to heartbeat.h so that log messages get checked as
1102        printf-style messages on GNU C compilers
1103  + Changed several log messages to have the right parameters (discovered
1104        as a result of the change above)
1105  + Numerous FreeBSD, Solaris and OpenBSD fixes.
1106  + Added backwards compatibility kludge for udp (versus bcast)
1107  + Queued messages to API clients instead of throwing them away.
1108  + Added code to send out messages when clients join, leave.
1109  + Added support for spawning and monitoring child clients.
1110  + Cleaned up error messages.
1111  + Added support for DB2, ServeRAID and WAS, LVM, and Apache (IBMhttp too),
1112    also ICP Vortex controller.
1113  + Added locking when creating new IP aliases.
1114  + Added a "unicast" media option.
1115  + Added a new SimulStart and standby test case.
1116  + Diddled init levels around...
1117  + Added an application-level heartbeat API.
1118  + Added several new "plumbing" subsystems (IPC, longclock_t, proctrack, etc.)
1119  + Added a new "contrib" directory.
1120  + Fixed serious (but trivial) bug in the process tracking code which caused
1121        it to exit heartbeat - this occurred repeatably for STONITH operations.
1122  + Write a 'v' to the watchdog device to tell it not to reboot us when
1123        we close the device.
1124  + Various ldirectord fixes due to Horms
1125  + Minor patch from Lorn Kay to deal with loopback interfaces which might
1126        have been put in by LVS direct routing
1127  + Updated AUTHORS file and moved list of authors over
1128
1129* Fri Mar 16 2001  Alan Robertson <alanr@unix.sh>
1130+ Version 0.4.9
1131
1132  + Split into 3 rpms - heartbeat, heartbeat-stonith and heartbeat-ldirectord
1133
1134  + Made media modules and authentication modules and stonith modules
1135        dynamically loadable.
1136
1137  + Added Multicast media support
1138  + Added ping node/membership/link type for tiebreaking.  This will
1139        be useful when implementing quorum on 2-node systems.
1140        (not yet compatible with nice_failback(?))
1141  + Removed ppp support
1142
1143  + Heartbeat client API support
1144
1145  + Added STONITH API library
1146    +   support for the Baytech RPC-3A power switch
1147    +   support for the APCsmart UPS
1148    +   support for the VACM cluster management tool
1149    +   support for WTI RPS10
1150    +   support for Night/Ware RPC100S
1151    +   support for "Meatware" (human intervention) module
1152    +   support for "null" (testing only) module
1153
1154  + Fixed startup timing bugs
1155  + Fixed shutdown sequence bugs: takeover occurred before
1156        resources were released by other system
1157  + Fixed various logging bugs
1158  + Closed holes in protection against replay attacks
1159
1160  + Added checks that complain if all resources aren't idle on startup.
1161  + IP address takeover fixes
1162      + Endian fixes
1163      + Removed the 8-alias limitation
1164      + Takeovers now occur faster (ARPs occur asynchronously)
1165
1166  + Port number changes
1167    + Use our IANA port number (694) by default
1168    + Recognize our IANA port number ("ha-cluster") if it's in /etc/services
1169
1170  + Moved several files, etc. from /var/run to /var/lib/heartbeat
1171  + Incorporated new ldirectord version
1172  + Added late heartbeat warning for late-arriving heartbeats
1173  + Added detection of and partial recovery from cluster partitions
1174  + Accept multiple arguments for resource scripts
1175  + Added Raid1 and Filesystem resource scripts
1176  + Added man pages
1177  + Added debian package support
1178
1179* Fri Jun 30 2000 Alan Robertson <alanr@unix.sh>
1180+ Version 0.4.8
1181  + Incorporated ldirectord version 1.9 (fixes memory leak)
1182  + Made the order of resource takeover more rational:  Takeover is now
1183    left-to-right, and giveup is right-to-left
1184  + Changed the default port number to our official IANA port number (694)
1185  + Regularized more messages, eliminated some redundant ones.
1186  + Print the version of heartbeat when starting.
1187  + Print exhaustive version info when starting with debug on.
1188  + Hosts now have 3 statuses {down, up, active} active means that it knows
1189        that all its links are operational, and it's safe to send cluster
1190        messages
1191  + Significant revisions to nice_failback (mainly due to lclaudio)
1192  + More SuSE-compatibility. Thanks to Friedrich Lobenstock <fl@fl.priv.at>
1193  + Tidied up logging so it can be to files, to syslog or both (Horms)
1194  + Tidied up build process (Horms)
1195  + Updated ldirectord to produce and install a man page and be
1196    compatible with the fwmark options to The Linux Virtual Server (Horms)
1197  + Added log rotation for ldirectord and heartbeat using logrotate
1198    if it is installed
1199  + Added Audible Alarm resource by Kirk Lawson <lklawson@heapy.com>
1200    and myself (Horms)
1201  + Added init script for ldirectord so it can be run independently
1202    of heartbeat (Horms)
1203  + Added sample config file for ldirectord (Horms)
1204  + An empty /etc/ha.d/conf/ is now part of the rpm distribution
1205    as this is where ldirectord's configuration belongs (Horms)
1206  + Minor startup script tweaks.  Hopefully, we should be able to make core
1207    files should we crash in the future.  Thanks to Holger Kiehl for diagnosing
1208    the problem!
1209  + Fixed a bug which kept the "logfile" option from ever working.
1210  + Added a TestCluster test utility.  Pretty primitive so far...
1211  + Fixed the serial locking code so that it unlocks when it shuts down.
1212  + Lock heartbeat into memory, and raise our priority
1213  + Minor, but important fix from lclaudio to init uninited variable.
1214
1215* Sat Dec 25 1999 Alan Robertson <alanr@unix.sh>
1216+ Version 0.4.7
1217  + Added the nice_failback feature. If the cluster is running when
1218        the primary starts it acts as a secondary. (Luis Claudio Goncalves)
1219  + Put in lots of code to make lost packet retransmission happen
1220  + Stopped trying to use the /proc/ha interface
1221  + Finished the error recovery in the heartbeat protocol (and got it to work)
1222  + Added test code for the heartbeat protocol
1223  + Raised the maximum length of a node name
1224  + Added Jacob Rief's ldirectord resource type
1225  + Added Stefan Salzer's <salt@cin.de> fix for a 'grep' in IPaddr which
1226        wasn't specific enough and would sometimes get IPaddr confused on
1227        IP addresses that prefix-matched.
1228  + Added Lars Marowsky-Bree's suggestion to make the code almost completely
1229        robust with respect to jumping the clock backwards and forwards
1230  + Added code from Michael Moerz <mike@cubit.at> to keep findif from
1231        core dumping if /proc/route can't be read.
1232
1233* Mon Nov 22 1999 Alan Robertson <alanr@unix.sh>
1234+ Version 0.4.6
1235  + Fixed timing problem in "heartbeat restart" so it's reliable now
1236  + Made start/stop status compatible with SuSE expectations
1237  + Made resource status detection compatible with SuSE start/stop expectations
1238  + Fixed a bug relating to serial and ppp-udp authentication (it never worked)
1239  + added a little more substance to the error recovery for the HB protocol.
1240  + Fixed a bug for logging from shell scripts
1241  + Added a little logging for initial resource acquisition
1242  + Added #!/bin/sh to the front of shell scripts
1243  + Fixed Makefile, so that the build root wasn't compiled into pathnames
1244  + Turned on CTSRTS, enabling flow control for serial ports.
1245  + Fixed a bug which kept it from working in non-English environments
1246
1247* Wed Oct 13 1999 Alan Robertson <alanr@unix.sh>
1248+ Version 0.4.5
1249  + Mitja Sarp added a new feature to authenticate heartbeat packets
1250        using a variety of strong authentication techniques
1251  + Changed resource acquisition and relinquishment to occur in heartbeat,
1252       instead of in the start/stop script.  This means you don't *really*
1253       have to use the start/stop script if you don't want to.
1254  + Added -k option to gracefully shut down current heartbeat instance
1255  + Added -r option to cause currently running heartbeat to reread config files
1256  + Added -s option to report on operational status of "heartbeat"
1257  + Sped up resource acquisition on master restart.
1258  + Added validation of ipresources file at startup time.
1259  + Added code to allow the IPaddr takeover script to be given the
1260        interface to take over, instead of inferring it.  This was requested
1261        by Lars Marowsky-Bree
1262  + Incorporated patch from Guenther Thomsen to implement locking for
1263        serial ports used for heartbeats
1264  + Incorporated patch from Guenther Thomsen to clean up logging.
1265        (you can now use syslog and/or file logs)
1266  + Improved FreeBSD compatibility.
1267  + Fixed a bug where the FIFO doesn't get created correctly.
1268  + Fixed a couple of uninitialized variables in heartbeat and /proc/ha code
1269  + Fixed longstanding crash bug related to getting a SIGALRM while in malloc
1270        or free.
1271  + Implemented new memory management scheme, including memory stats
1272
1273* Thu Sep 16 1999 Alan Robertson <alanr@unix.sh>
1274+ Version 0.4.4
1275  + Fixed a stupid error in handling CIDR addresses in IPaddr.
1276  + Updated the documentation with the latest from Rudy.
1277
1278* Wed Sep 15 1999 Alan Robertson <alanr@unix.sh>
1279+ Version 0.4.3
1280  + Changed startup scripts to create /dev/watchdog if needed
1281  + Turned off loading of /proc/ha module by default.
1282  + Incorporated bug fix from Thomas Hepper <th@ant.han.de> to IPaddr for
1283        PPP configurations
1284  + Put in a fix from Gregor Howey <ghowey@bremer-nachrichten.de>
1285        where Gregor found that I had stripped off the ::resourceid part
1286        of the string in ResourceManager resulting in some bad calls later on.
1287  +  Made it compliant with the FHS (filesystem hierarchy standard)
1288  +  Fixed IP address takeover so we can take over on non-eth0 interface
1289  +  Fixed IP takeover code so we can specify netmasks and broadcast addrs,
1290        or default them at the user's option.
1291  +  Added code to report on message buffer usage on SIGUSR[12]
1292  +  Made SIGUSR1 increment debug level, and SIGUSR2 decrement it.
1293  +  Incorporated Rudy's latest "Getting Started" document
1294  +  Made it largely Debian-compliant.  Thanks to Guenther Thomsen, Thomas
1295        Hepper, Iñaki Fernández Villanueva and others.
1296  +  Made changes to work better with Red Hat 6.1, and SMP code.
1297  +  Sometimes it seems that the Master Control Process dies :-(
1298
1299* Sat Aug 14 1999 Alan Robertson <alanr@unix.sh>
1300+ Version 0.4.2
1301  + Implemented simple resource groups
1302  + Implemented application notification for groups starting/stopping
1303  + Eliminated restriction on floating IPs only being associated with eth0
1304  + Added a uniform resource model, with IP resources being only one kind.
1305        (Thanks to Lars Marowsky-Bree for a good suggestion)
1306  + Largely rewrote the IP address takeover code, making it clearer, fit
1307        into the uniform resource model, and removing some restrictions.
1308  + Preliminary "Getting Started" document by Rudy Pawul
1309  + Improved the /proc/ha code
1310  + Fixed memory leak associated with serial ports, and problem with return
1311        of control to the "master" node.
1312        (Thanks to Holger Kiehl for reporting them, and testing fixes!)
1313
1314* Tue Jul 6 1999 Alan Robertson <alanr@unix.sh>
1315+ Version 0.4.1
1316  + Fixed major memory leak in 0.4.0 (oops!)
1317  + Added code to eliminate duplicate packets and log lost ones
1318  + Tightened up PPP/UDP startup/shutdown code
1319  + Made PPP/UDP peacefully coexist with "normal" udp
1320  + Made logs more uniform and neater
1321  + Fixed several other minor bugs
1322  + Added very preliminary kernel code for monitoring and controlling
1323        heartbeat via /proc/ha.  Very cool, but not really done yet.
1324
1325* Wed Jun 30 1999 Alan Robertson <alanr@unix.sh>
1326+ Version 0.4.0
1327  + Changed packet format from single line positional parameter style
1328        to a collection of {name,value} pairs.  A vital change for the future.
1329  + Fixed some bugs with regard to forwarding data around rings
1330  + We now modify /etc/ppp/ip-up.local, so PPP-udp works out of the box
1331        (at least for Red Hat)
1332  + Includes the first version of Volker Wiegand's Hardware Installation Guide
1333        (it's pretty good for a first version!)
1334
1335* Wed Jun 09 1999 Alan Robertson <alanr@unix.sh>
1336+ Version 0.3.2
1337  + Added UDP/PPP bidirectional serial ring heartbeat
1338        (PPP ensures data integrity on the serial links)
1339  + fixed a stupid bug which caused shutdown to give unpredictable
1340        results
1341  + added timestamps to /var/log/ha-log messages
1342  + fixed a couple of other minor oversights.
1343
1344* Mon May 10 1999 Alan Robertson <alanr@unix.sh>
1345+ Version 0.3.1
1346  + Make ChangeLog file from RPM specfile
1347  + Made ipresources only install in the DOC directory as a sample
1348
1349* Sun May 09 1999 Alan Robertson <alanr@unix.sh>
1350+ Version 0.3.0
1351  + Added UDP broadcast heartbeat (courtesy of Tom Vogt)
1352  + Significantly restructured code making it easier to add heartbeat media
1353  + added new directives to config file:
1354    + udp interface-name
1355    + udpport port-number
1356    + baud    serial-baud-rate
1357  + made manual daemon shutdown easier (only need to kill one)
1358  + moved the sample ha.cf file to the Doc directory
1359
1360* Sat Mar 27 1999 Alan Robertson <alanr@unix.sh>
1361+ Version 0.2.0
1362  + Make an RPM out of it
1363  + Integrated IP address takeover gotten from Horms
1364  + Added support to tickle a watchdog timer whenever our heart beats
1365  + Integrated enough basic code to allow a 2-node demo to occur
1366  + Integrated patches from Andrew Hildebrand <andrew@pdi.com> to allow it
1367    to run under IRIX.
1368  - Known Bugs
1369    - Only supports 2-node clusters
1370    - Only supports a single IP interface per node in the cluster
1371    - Doesn't yet include Tom Vogt's ethernet heartbeat code
1372    - No documentation
1373    - Not very useful yet :-)
1374
1375###########################################################
Note: See TracBrowser for help on using the repository browser.