diff --git a/case-study-porting-chardet-to-python-3.html b/case-study-porting-chardet-to-python-3.html
index 715fdbb..1d78229 100644
--- a/case-study-porting-chardet-to-python-3.html
+++ b/case-study-porting-chardet-to-python-3.html
@@ -3,6 +3,7 @@
 <head>
 <meta charset=utf-8>
 <title>Case study: porting chardet to Python 3 - Dive into Python 3</title>
+<!--[if IE]><script src="html5.js"></script><![endif]-->
 <link rel=stylesheet type=text/css href=dip3.css>
 <link rel="shortcut icon" href=data:image/ico,>
 <link rel=alternate type=application/atom+xml href=http://hg.diveintopython3.org/atom-log>
@@ -42,6 +43,8 @@ body{counter-reset:h1 20}
   <li><a href=#namefileisnotdefined>Name '<var>file</var>' is not defined</a>
   <li><a href=#cantuseastringpattern>Can&#8217;t use a string pattern on a bytes-like object</a>
   <li><a href=#cantconvertbytesobject>Can&#8217;t convert '<code>bytes</code>' object to <code>str</code> implicitly</a>
+  <li><a href=#unsupportedoperandtypeforplus>TypeError: unsupported operand type(s) for +: 'int' and 'bytes'</a>
+  <li><a href=#ordexpectedstring>TypeError: ord() expected string of length 1, but int found</a>
   </ol>
 </ol>
 <h2 id=divingin>Introducing <code class=filename>chardet</code>: a mini-<abbr>FAQ</abbr></h2>
@@ -111,8 +114,8 @@ RefactoringTool: Skipping implicit fixer: ws_comma
  __version__ = "1.0.1"
 
  def detect(aBuf):
--    import universaldetector
-+    from . import universaldetector
+<del>-    import universaldetector</del>
+<ins>+    from . import universaldetector</ins>
      u = universaldetector.UniversalDetector()
      u.reset()
      u.feed(aBuf)
@@ -122,14 +125,14 @@ RefactoringTool: Skipping implicit fixer: ws_comma
  # 02110-1301  USA
  ######################### END LICENSE BLOCK #########################
 
--from mbcharsetprober import MultiByteCharSetProber
--from codingstatemachine import CodingStateMachine
--from chardistribution import Big5DistributionAnalysis
--from mbcssm import Big5SMModel
-+from .mbcharsetprober import MultiByteCharSetProber
-+from .codingstatemachine import CodingStateMachine
-+from .chardistribution import Big5DistributionAnalysis
-+from .mbcssm import Big5SMModel
+<del>-from mbcharsetprober import MultiByteCharSetProber</del>
+<del>-from codingstatemachine import CodingStateMachine</del>
+<del>-from chardistribution import Big5DistributionAnalysis</del>
+<del>-from mbcssm import Big5SMModel</del>
+<ins>+from .mbcharsetprober import MultiByteCharSetProber</ins>
+<ins>+from .codingstatemachine import CodingStateMachine</ins>
+<ins>+from .chardistribution import Big5DistributionAnalysis</ins>
+<ins>+from .mbcssm import Big5SMModel</ins>
 
  class Big5Prober(MultiByteCharSetProber):
      def __init__(self):
@@ -139,18 +142,18 @@ RefactoringTool: Skipping implicit fixer: ws_comma
  # 02110-1301  USA
  ######################### END LICENSE BLOCK #########################
 
--import constants
--from euctwfreq import EUCTWCharToFreqOrder, EUCTW_TABLE_SIZE, EUCTW_TYPICAL_DISTRIBUTION_RATIO
--from euckrfreq import EUCKRCharToFreqOrder, EUCKR_TABLE_SIZE, EUCKR_TYPICAL_DISTRIBUTION_RATIO
--from gb2312freq import GB2312CharToFreqOrder, GB2312_TABLE_SIZE, GB2312_TYPICAL_DISTRIBUTION_RATIO
--from big5freq import Big5CharToFreqOrder, BIG5_TABLE_SIZE, BIG5_TYPICAL_DISTRIBUTION_RATIO
--from jisfreq import JISCharToFreqOrder, JIS_TABLE_SIZE, JIS_TYPICAL_DISTRIBUTION_RATIO
-+from . import constants
-+from .euctwfreq import EUCTWCharToFreqOrder, EUCTW_TABLE_SIZE, EUCTW_TYPICAL_DISTRIBUTION_RATIO
-+from .euckrfreq import EUCKRCharToFreqOrder, EUCKR_TABLE_SIZE, EUCKR_TYPICAL_DISTRIBUTION_RATIO
-+from .gb2312freq import GB2312CharToFreqOrder, GB2312_TABLE_SIZE, GB2312_TYPICAL_DISTRIBUTION_RATIO
-+from .big5freq import Big5CharToFreqOrder, BIG5_TABLE_SIZE, BIG5_TYPICAL_DISTRIBUTION_RATIO
-+from .jisfreq import JISCharToFreqOrder, JIS_TABLE_SIZE, JIS_TYPICAL_DISTRIBUTION_RATIO
+<del>-import constants</del>
+<del>-from euctwfreq import EUCTWCharToFreqOrder, EUCTW_TABLE_SIZE, EUCTW_TYPICAL_DISTRIBUTION_RATIO</del>
+<del>-from euckrfreq import EUCKRCharToFreqOrder, EUCKR_TABLE_SIZE, EUCKR_TYPICAL_DISTRIBUTION_RATIO</del>
+<del>-from gb2312freq import GB2312CharToFreqOrder, GB2312_TABLE_SIZE, GB2312_TYPICAL_DISTRIBUTION_RATIO</del>
+<del>-from big5freq import Big5CharToFreqOrder, BIG5_TABLE_SIZE, BIG5_TYPICAL_DISTRIBUTION_RATIO</del>
+<del>-from jisfreq import JISCharToFreqOrder, JIS_TABLE_SIZE, JIS_TYPICAL_DISTRIBUTION_RATIO</del>
+<ins>+from . import constants</ins>
+<ins>+from .euctwfreq import EUCTWCharToFreqOrder, EUCTW_TABLE_SIZE, EUCTW_TYPICAL_DISTRIBUTION_RATIO</ins>
+<ins>+from .euckrfreq import EUCKRCharToFreqOrder, EUCKR_TABLE_SIZE, EUCKR_TYPICAL_DISTRIBUTION_RATIO</ins>
+<ins>+from .gb2312freq import GB2312CharToFreqOrder, GB2312_TABLE_SIZE, GB2312_TYPICAL_DISTRIBUTION_RATIO</ins>
+<ins>+from .big5freq import Big5CharToFreqOrder, BIG5_TABLE_SIZE, BIG5_TYPICAL_DISTRIBUTION_RATIO</ins>
+<ins>+from .jisfreq import JISCharToFreqOrder, JIS_TABLE_SIZE, JIS_TYPICAL_DISTRIBUTION_RATIO</ins>
 
  ENOUGH_DATA_THRESHOLD = 1024
  SURE_YES = 0.99
@@ -160,8 +163,8 @@ RefactoringTool: Skipping implicit fixer: ws_comma
  ######################### END LICENSE BLOCK #########################
 
  import constants, sys
--from charsetprober import CharSetProber
-+from .charsetprober import CharSetProber
+<del>-from charsetprober import CharSetProber</del>
+<ins>+from .charsetprober import CharSetProber</ins>
 
  class CharSetGroupProber(CharSetProber):
      def __init__(self):
@@ -171,8 +174,8 @@ RefactoringTool: Skipping implicit fixer: ws_comma
  # 02110-1301  USA
  ######################### END LICENSE BLOCK #########################
 
--from constants import eStart, eError, eItsMe
-+from .constants import eStart, eError, eItsMe
+<del>-from constants import eStart, eError, eItsMe</del>
+<ins>+from .constants import eStart, eError, eItsMe</ins>
 
  class CodingStateMachine:
      def __init__(self, sm):
@@ -182,28 +185,28 @@ RefactoringTool: Skipping implicit fixer: ws_comma
 
  SHORTCUT_THRESHOLD = 0.95
 
--import __builtin__
-+import builtins
+<del>-import __builtin__</del>
+<ins>+import builtins</ins>
  if not hasattr(__builtin__, 'False'):
      False = 0
      True = 1
  else:
--    False = __builtin__.False
--    True = __builtin__.True
-+    False = builtins.False
-+    True = builtins.True
+<del>-    False = __builtin__.False</del>
+<del>-    True = __builtin__.True</del>
+<ins>+    False = builtins.False</ins>
+<ins>+    True = builtins.True</ins>
 --- chardet\escprober.py (original)
 +++ chardet\escprober.py (refactored)
 @@ -26,9 +26,9 @@
  ######################### END LICENSE BLOCK #########################
 
  import constants, sys
--from escsm import HZSMModel, ISO2022CNSMModel, ISO2022JPSMModel, ISO2022KRSMModel
--from charsetprober import CharSetProber
--from codingstatemachine import CodingStateMachine
-+from .escsm import HZSMModel, ISO2022CNSMModel, ISO2022JPSMModel, ISO2022KRSMModel
-+from .charsetprober import CharSetProber
-+from .codingstatemachine import CodingStateMachine
+<del>-from escsm import HZSMModel, ISO2022CNSMModel, ISO2022JPSMModel, ISO2022KRSMModel</del>
+<del>-from charsetprober import CharSetProber</del>
+<del>-from codingstatemachine import CodingStateMachine</del>
+<ins>+from .escsm import HZSMModel, ISO2022CNSMModel, ISO2022JPSMModel, ISO2022KRSMModel</ins>
+<ins>+from .charsetprober import CharSetProber</ins>
+<ins>+from .codingstatemachine import CodingStateMachine</ins>
 
  class EscCharSetProber(CharSetProber):
      def __init__(self):
@@ -213,8 +216,8 @@ RefactoringTool: Skipping implicit fixer: ws_comma
  # 02110-1301  USA
  ######################### END LICENSE BLOCK #########################
 
--from constants import eStart, eError, eItsMe
-+from .constants import eStart, eError, eItsMe
+<del>-from constants import eStart, eError, eItsMe</del>
+<ins>+from .constants import eStart, eError, eItsMe</ins>
 
  HZ_cls = ( \
  1,0,0,0,0,0,0,0,  # 00 - 07
@@ -224,18 +227,18 @@ RefactoringTool: Skipping implicit fixer: ws_comma
  ######################### END LICENSE BLOCK #########################
 
  import constants, sys
--from constants import eStart, eError, eItsMe
--from mbcharsetprober import MultiByteCharSetProber
--from codingstatemachine import CodingStateMachine
--from chardistribution import EUCJPDistributionAnalysis
--from jpcntx import EUCJPContextAnalysis
--from mbcssm import EUCJPSMModel
-+from .constants import eStart, eError, eItsMe
-+from .mbcharsetprober import MultiByteCharSetProber
-+from .codingstatemachine import CodingStateMachine
-+from .chardistribution import EUCJPDistributionAnalysis
-+from .jpcntx import EUCJPContextAnalysis
-+from .mbcssm import EUCJPSMModel
+<del>-from constants import eStart, eError, eItsMe</del>
+<del>-from mbcharsetprober import MultiByteCharSetProber</del>
+<del>-from codingstatemachine import CodingStateMachine</del>
+<del>-from chardistribution import EUCJPDistributionAnalysis</del>
+<del>-from jpcntx import EUCJPContextAnalysis</del>
+<del>-from mbcssm import EUCJPSMModel</del>
+<ins>+from .constants import eStart, eError, eItsMe</ins>
+<ins>+from .mbcharsetprober import MultiByteCharSetProber</ins>
+<ins>+from .codingstatemachine import CodingStateMachine</ins>
+<ins>+from .chardistribution import EUCJPDistributionAnalysis</ins>
+<ins>+from .jpcntx import EUCJPContextAnalysis</ins>
+<ins>+from .mbcssm import EUCJPSMModel</ins>
 
  class EUCJPProber(MultiByteCharSetProber):
      def __init__(self):
@@ -245,14 +248,14 @@ RefactoringTool: Skipping implicit fixer: ws_comma
  # 02110-1301  USA
  ######################### END LICENSE BLOCK #########################
 
--from mbcharsetprober import MultiByteCharSetProber
--from codingstatemachine import CodingStateMachine
--from chardistribution import EUCKRDistributionAnalysis
--from mbcssm import EUCKRSMModel
-+from .mbcharsetprober import MultiByteCharSetProber
-+from .codingstatemachine import CodingStateMachine
-+from .chardistribution import EUCKRDistributionAnalysis
-+from .mbcssm import EUCKRSMModel
+<del>-from mbcharsetprober import MultiByteCharSetProber</del>
+<del>-from codingstatemachine import CodingStateMachine</del>
+<del>-from chardistribution import EUCKRDistributionAnalysis</del>
+<del>-from mbcssm import EUCKRSMModel</del>
+<ins>+from .mbcharsetprober import MultiByteCharSetProber</ins>
+<ins>+from .codingstatemachine import CodingStateMachine</ins>
+<ins>+from .chardistribution import EUCKRDistributionAnalysis</ins>
+<ins>+from .mbcssm import EUCKRSMModel</ins>
 
  class EUCKRProber(MultiByteCharSetProber):
      def __init__(self):
@@ -262,14 +265,14 @@ RefactoringTool: Skipping implicit fixer: ws_comma
  # 02110-1301  USA
  ######################### END LICENSE BLOCK #########################
 
--from mbcharsetprober import MultiByteCharSetProber
--from codingstatemachine import CodingStateMachine
--from chardistribution import EUCTWDistributionAnalysis
--from mbcssm import EUCTWSMModel
-+from .mbcharsetprober import MultiByteCharSetProber
-+from .codingstatemachine import CodingStateMachine
-+from .chardistribution import EUCTWDistributionAnalysis
-+from .mbcssm import EUCTWSMModel
+<del>-from mbcharsetprober import MultiByteCharSetProber</del>
+<del>-from codingstatemachine import CodingStateMachine</del>
+<del>-from chardistribution import EUCTWDistributionAnalysis</del>
+<del>-from mbcssm import EUCTWSMModel</del>
+<ins>+from .mbcharsetprober import MultiByteCharSetProber</ins>
+<ins>+from .codingstatemachine import CodingStateMachine</ins>
+<ins>+from .chardistribution import EUCTWDistributionAnalysis</ins>
+<ins>+from .mbcssm import EUCTWSMModel</ins>
 
  class EUCTWProber(MultiByteCharSetProber):
      def __init__(self):
@@ -279,14 +282,14 @@ RefactoringTool: Skipping implicit fixer: ws_comma
  # 02110-1301  USA
  ######################### END LICENSE BLOCK #########################
 
--from mbcharsetprober import MultiByteCharSetProber
--from codingstatemachine import CodingStateMachine
--from chardistribution import GB2312DistributionAnalysis
--from mbcssm import GB2312SMModel
-+from .mbcharsetprober import MultiByteCharSetProber
-+from .codingstatemachine import CodingStateMachine
-+from .chardistribution import GB2312DistributionAnalysis
-+from .mbcssm import GB2312SMModel
+<del>-from mbcharsetprober import MultiByteCharSetProber</del>
+<del>-from codingstatemachine import CodingStateMachine</del>
+<del>-from chardistribution import GB2312DistributionAnalysis</del>
+<del>-from mbcssm import GB2312SMModel</del>
+<ins>+from .mbcharsetprober import MultiByteCharSetProber</ins>
+<ins>+from .codingstatemachine import CodingStateMachine</ins>
+<ins>+from .chardistribution import GB2312DistributionAnalysis</ins>
+<ins>+from .mbcssm import GB2312SMModel</ins>
 
  class GB2312Prober(MultiByteCharSetProber):
      def __init__(self):
@@ -296,10 +299,10 @@ RefactoringTool: Skipping implicit fixer: ws_comma
  # 02110-1301  USA
  ######################### END LICENSE BLOCK #########################
 
--from charsetprober import CharSetProber
--import constants
-+from .charsetprober import CharSetProber
-+from . import constants
+<del>-from charsetprober import CharSetProber</del>
+<del>-import constants</del>
+<ins>+from .charsetprober import CharSetProber</ins>
+<ins>+from . import constants</ins>
 
  # This prober doesn't actually recognize a language or a charset.
  # It is a helper prober for the use of the Hebrew model probers
@@ -309,8 +312,8 @@ RefactoringTool: Skipping implicit fixer: ws_comma
  # 02110-1301  USA
  ######################### END LICENSE BLOCK #########################
 
--import constants
-+from . import constants
+<del>-import constants</del>
+<ins>+from . import constants</ins>
 
  NUM_OF_CATEGORY = 6
  DONT_KNOW = -1
@@ -320,8 +323,8 @@ RefactoringTool: Skipping implicit fixer: ws_comma
  # 02110-1301  USA
  ######################### END LICENSE BLOCK #########################
 
--import constants
-+from . import constants
+<del>-import constants</del>
+<ins>+from . import constants</ins>
 
  # 255: Control characters that usually does not exist in any text
  # 254: Carriage/Return
@@ -331,8 +334,8 @@ RefactoringTool: Skipping implicit fixer: ws_comma
  # 02110-1301  USA
  ######################### END LICENSE BLOCK #########################
 
--import constants
-+from . import constants
+<del>-import constants</del>
+<ins>+from . import constants</ins>
 
  # KOI8-R language model
  # Character Mapping Table:
@@ -342,8 +345,8 @@ RefactoringTool: Skipping implicit fixer: ws_comma
  # 02110-1301  USA
  ######################### END LICENSE BLOCK #########################
 
--import constants
-+from . import constants
+<del>-import constants</del>
+<ins>+from . import constants</ins>
 
  # 255: Control characters that usually does not exist in any text
  # 254: Carriage/Return
@@ -353,8 +356,8 @@ RefactoringTool: Skipping implicit fixer: ws_comma
  # 02110-1301  USA
  ######################### END LICENSE BLOCK #########################
 
--import constants
-+from . import constants
+<del>-import constants</del>
+<ins>+from . import constants</ins>
 
  # 255: Control characters that usually does not exist in any text
  # 254: Carriage/Return
@@ -364,8 +367,8 @@ RefactoringTool: Skipping implicit fixer: ws_comma
  # 02110-1301  USA
  ######################### END LICENSE BLOCK #########################
 
--import constants
-+from . import constants
+<del>-import constants</del>
+<ins>+from . import constants</ins>
 
  # 255: Control characters that usually does not exist in any text
  # 254: Carriage/Return
@@ -375,8 +378,8 @@ RefactoringTool: Skipping implicit fixer: ws_comma
  # 02110-1301  USA
  ######################### END LICENSE BLOCK #########################
 
--import constants
-+from . import constants
+<del>-import constants</del>
+<ins>+from . import constants</ins>
 
  # 255: Control characters that usually does not exist in any text
  # 254: Carriage/Return
@@ -386,10 +389,10 @@ RefactoringTool: Skipping implicit fixer: ws_comma
  # 02110-1301  USA
  ######################### END LICENSE BLOCK #########################
 
--from charsetprober import CharSetProber
--import constants
-+from .charsetprober import CharSetProber
-+from . import constants
+<del>-from charsetprober import CharSetProber</del>
+<del>-import constants</del>
+<ins>+from .charsetprober import CharSetProber</ins>
+<ins>+from . import constants</ins>
  import operator
 
  FREQ_CAT_NUM = 4
@@ -399,10 +402,10 @@ RefactoringTool: Skipping implicit fixer: ws_comma
  ######################### END LICENSE BLOCK #########################
 
  import constants, sys
--from constants import eStart, eError, eItsMe
--from charsetprober import CharSetProber
-+from .constants import eStart, eError, eItsMe
-+from .charsetprober import CharSetProber
+<del>-from constants import eStart, eError, eItsMe</del>
+<del>-from charsetprober import CharSetProber</del>
+<ins>+from .constants import eStart, eError, eItsMe</ins>
+<ins>+from .charsetprober import CharSetProber</ins>
 
  class MultiByteCharSetProber(CharSetProber):
      def __init__(self):
@@ -412,22 +415,22 @@ RefactoringTool: Skipping implicit fixer: ws_comma
  # 02110-1301  USA
  ######################### END LICENSE BLOCK #########################
 
--from charsetgroupprober import CharSetGroupProber
--from utf8prober import UTF8Prober
--from sjisprober import SJISProber
--from eucjpprober import EUCJPProber
--from gb2312prober import GB2312Prober
--from euckrprober import EUCKRProber
--from big5prober import Big5Prober
--from euctwprober import EUCTWProber
-+from .charsetgroupprober import CharSetGroupProber
-+from .utf8prober import UTF8Prober
-+from .sjisprober import SJISProber
-+from .eucjpprober import EUCJPProber
-+from .gb2312prober import GB2312Prober
-+from .euckrprober import EUCKRProber
-+from .big5prober import Big5Prober
-+from .euctwprober import EUCTWProber
+<del>-from charsetgroupprober import CharSetGroupProber</del>
+<del>-from utf8prober import UTF8Prober</del>
+<del>-from sjisprober import SJISProber</del>
+<del>-from eucjpprober import EUCJPProber</del>
+<del>-from gb2312prober import GB2312Prober</del>
+<del>-from euckrprober import EUCKRProber</del>
+<del>-from big5prober import Big5Prober</del>
+<del>-from euctwprober import EUCTWProber</del>
+<ins>+from .charsetgroupprober import CharSetGroupProber</ins>
+<ins>+from .utf8prober import UTF8Prober</ins>
+<ins>+from .sjisprober import SJISProber</ins>
+<ins>+from .eucjpprober import EUCJPProber</ins>
+<ins>+from .gb2312prober import GB2312Prober</ins>
+<ins>+from .euckrprober import EUCKRProber</ins>
+<ins>+from .big5prober import Big5Prober</ins>
+<ins>+from .euctwprober import EUCTWProber</ins>
 
  class MBCSGroupProber(CharSetGroupProber):
      def __init__(self):
@@ -437,8 +440,8 @@ RefactoringTool: Skipping implicit fixer: ws_comma
  # 02110-1301  USA
  ######################### END LICENSE BLOCK #########################
 
--from constants import eStart, eError, eItsMe
-+from .constants import eStart, eError, eItsMe
+<del>-from constants import eStart, eError, eItsMe</del>
+<ins>+from .constants import eStart, eError, eItsMe</ins>
 
  # BIG5
 
@@ -448,8 +451,8 @@ RefactoringTool: Skipping implicit fixer: ws_comma
  ######################### END LICENSE BLOCK #########################
 
  import constants, sys
--from charsetprober import CharSetProber
-+from .charsetprober import CharSetProber
+<del>-from charsetprober import CharSetProber</del>
+<ins>+from .charsetprober import CharSetProber</ins>
 
  SAMPLE_SIZE = 64
  SB_ENOUGH_REL_THRESHOLD = 1024
@@ -459,24 +462,24 @@ RefactoringTool: Skipping implicit fixer: ws_comma
  ######################### END LICENSE BLOCK #########################
 
  import constants, sys
--from charsetgroupprober import CharSetGroupProber
--from sbcharsetprober import SingleByteCharSetProber
--from langcyrillicmodel import Win1251CyrillicModel, Koi8rModel, Latin5CyrillicModel, MacCyrillicModel, Ibm866Model, Ibm855Model
--from langgreekmodel import Latin7GreekModel, Win1253GreekModel
--from langbulgarianmodel import Latin5BulgarianModel, Win1251BulgarianModel
--from langhungarianmodel import Latin2HungarianModel, Win1250HungarianModel
--from langthaimodel import TIS620ThaiModel
--from langhebrewmodel import Win1255HebrewModel
--from hebrewprober import HebrewProber
-+from .charsetgroupprober import CharSetGroupProber
-+from .sbcharsetprober import SingleByteCharSetProber
-+from .langcyrillicmodel import Win1251CyrillicModel, Koi8rModel, Latin5CyrillicModel, MacCyrillicModel, Ibm866Model, Ibm855Model
-+from .langgreekmodel import Latin7GreekModel, Win1253GreekModel
-+from .langbulgarianmodel import Latin5BulgarianModel, Win1251BulgarianModel
-+from .langhungarianmodel import Latin2HungarianModel, Win1250HungarianModel
-+from .langthaimodel import TIS620ThaiModel
-+from .langhebrewmodel import Win1255HebrewModel
-+from .hebrewprober import HebrewProber
+<del>-from charsetgroupprober import CharSetGroupProber</del>
+<del>-from sbcharsetprober import SingleByteCharSetProber</del>
+<del>-from langcyrillicmodel import Win1251CyrillicModel, Koi8rModel, Latin5CyrillicModel, MacCyrillicModel, Ibm866Model, Ibm855Model</del>
+<del>-from langgreekmodel import Latin7GreekModel, Win1253GreekModel</del>
+<del>-from langbulgarianmodel import Latin5BulgarianModel, Win1251BulgarianModel</del>
+<del>-from langhungarianmodel import Latin2HungarianModel, Win1250HungarianModel</del>
+<del>-from langthaimodel import TIS620ThaiModel</del>
+<del>-from langhebrewmodel import Win1255HebrewModel</del>
+<del>-from hebrewprober import HebrewProber</del>
+<ins>+from .charsetgroupprober import CharSetGroupProber</ins>
+<ins>+from .sbcharsetprober import SingleByteCharSetProber</ins>
+<ins>+from .langcyrillicmodel import Win1251CyrillicModel, Koi8rModel, Latin5CyrillicModel, MacCyrillicModel, Ibm866Model, Ibm855Model</ins>
+<ins>+from .langgreekmodel import Latin7GreekModel, Win1253GreekModel</ins>
+<ins>+from .langbulgarianmodel import Latin5BulgarianModel, Win1251BulgarianModel</ins>
+<ins>+from .langhungarianmodel import Latin2HungarianModel, Win1250HungarianModel</ins>
+<ins>+from .langthaimodel import TIS620ThaiModel</ins>
+<ins>+from .langhebrewmodel import Win1255HebrewModel</ins>
+<ins>+from .hebrewprober import HebrewProber</ins>
 
  class SBCSGroupProber(CharSetGroupProber):
      def __init__(self):
@@ -486,19 +489,19 @@ RefactoringTool: Skipping implicit fixer: ws_comma
  # 02110-1301  USA
  ######################### END LICENSE BLOCK #########################
 
--from mbcharsetprober import MultiByteCharSetProber
--from codingstatemachine import CodingStateMachine
--from chardistribution import SJISDistributionAnalysis
--from jpcntx import SJISContextAnalysis
--from mbcssm import SJISSMModel
-+from .mbcharsetprober import MultiByteCharSetProber
-+from .codingstatemachine import CodingStateMachine
-+from .chardistribution import SJISDistributionAnalysis
-+from .jpcntx import SJISContextAnalysis
-+from .mbcssm import SJISSMModel
+<del>-from mbcharsetprober import MultiByteCharSetProber</del>
+<del>-from codingstatemachine import CodingStateMachine</del>
+<del>-from chardistribution import SJISDistributionAnalysis</del>
+<del>-from jpcntx import SJISContextAnalysis</del>
+<del>-from mbcssm import SJISSMModel</del>
+<ins>+from .mbcharsetprober import MultiByteCharSetProber</ins>
+<ins>+from .codingstatemachine import CodingStateMachine</ins>
+<ins>+from .chardistribution import SJISDistributionAnalysis</ins>
+<ins>+from .jpcntx import SJISContextAnalysis</ins>
+<ins>+from .mbcssm import SJISSMModel</ins>
  import constants, sys
--from constants import eStart, eError, eItsMe
-+from .constants import eStart, eError, eItsMe
+<del>-from constants import eStart, eError, eItsMe</del>
+<ins>+from .constants import eStart, eError, eItsMe</ins>
 
  class SJISProber(MultiByteCharSetProber):
      def __init__(self):
@@ -508,14 +511,14 @@ RefactoringTool: Skipping implicit fixer: ws_comma
  ######################### END LICENSE BLOCK #########################
 
  import constants, sys
--from latin1prober import Latin1Prober # windows-1252
--from mbcsgroupprober import MBCSGroupProber # multi-byte character sets
--from sbcsgroupprober import SBCSGroupProber # single-byte character sets
--from escprober import EscCharSetProber # ISO-2122, etc.
-+from .latin1prober import Latin1Prober # windows-1252
-+from .mbcsgroupprober import MBCSGroupProber # multi-byte character sets
-+from .sbcsgroupprober import SBCSGroupProber # single-byte character sets
-+from .escprober import EscCharSetProber # ISO-2122, etc.
+<del>-from latin1prober import Latin1Prober # windows-1252</del>
+<del>-from mbcsgroupprober import MBCSGroupProber # multi-byte character sets</del>
+<del>-from sbcsgroupprober import SBCSGroupProber # single-byte character sets</del>
+<del>-from escprober import EscCharSetProber # ISO-2122, etc.</del>
+<ins>+from .latin1prober import Latin1Prober # windows-1252</ins>
+<ins>+from .mbcsgroupprober import MBCSGroupProber # multi-byte character sets</ins>
+<ins>+from .sbcsgroupprober import SBCSGroupProber # single-byte character sets</ins>
+<ins>+from .escprober import EscCharSetProber # ISO-2122, etc.</ins>
  import re
 
  MINIMUM_THRESHOLD = 0.20
@@ -525,14 +528,14 @@ RefactoringTool: Skipping implicit fixer: ws_comma
  ######################### END LICENSE BLOCK #########################
 
  import constants, sys
--from constants import eStart, eError, eItsMe
--from charsetprober import CharSetProber
--from codingstatemachine import CodingStateMachine
--from mbcssm import UTF8SMModel
-+from .constants import eStart, eError, eItsMe
-+from .charsetprober import CharSetProber
-+from .codingstatemachine import CodingStateMachine
-+from .mbcssm import UTF8SMModel
+<del>-from constants import eStart, eError, eItsMe</del>
+<del>-from charsetprober import CharSetProber</del>
+<del>-from codingstatemachine import CodingStateMachine</del>
+<del>-from mbcssm import UTF8SMModel</del>
+<ins>+from .constants import eStart, eError, eItsMe</ins>
+<ins>+from .charsetprober import CharSetProber</ins>
+<ins>+from .codingstatemachine import CodingStateMachine</ins>
+<ins>+from .mbcssm import UTF8SMModel</ins>
 
  ONE_CHAR_PROB = 0.5
 
@@ -579,8 +582,8 @@ RefactoringTool: Skipping implicit fixer: ws_comma
  count = 0
  u = UniversalDetector()
  for f in glob.glob(sys.argv[1]):
--    print f.ljust(60),
-+    print(f.ljust(60), end=' ')
+<del>-    print f.ljust(60),</del>
+<ins>+    print(f.ljust(60), end=' ')</ins>
      u.reset()
      for line in file(f, 'rb'):
          u.feed(line)
@@ -588,14 +591,14 @@ RefactoringTool: Skipping implicit fixer: ws_comma
      u.close()
      result = u.result
      if result['encoding']:
--        print result['encoding'], 'with confidence', result['confidence']
-+        print(result['encoding'], 'with confidence', result['confidence'])
+<del>-        print result['encoding'], 'with confidence', result['confidence']</del>
+<ins>+        print(result['encoding'], 'with confidence', result['confidence'])</ins>
      else:
--        print '******** no result'
-+        print('******** no result')
+<del>-        print '******** no result'</del>
+<ins>+        print('******** no result')</ins>
      count += 1
--print count, 'tests'
-+print(count, 'tests')
+<del>-print count, 'tests'</del>
+<ins>+print(count, 'tests')</ins>
 RefactoringTool: Files that were modified:
 RefactoringTool: test.py</samp></pre>
 <p id=skip2to3outputtest>Well, that wasn&#8217;t so hard. Just a few imports and print statements to convert. Time to run the new version. Do you think it&#8217;ll work?
@@ -648,7 +651,7 @@ import sys</code></pre>
 <p>There are variations of this problem scattered throughout the <code class=filename>chardet</code> library. In some places it&#8217;s "<code>import constants, sys</code>"; in other places, it&#8217;s "<code>import constants, re</code>". The fix is the same: manually split the import statement into two lines, one for the relative import, the other for the absolute import.
 <p>Onward!
 <h3 id=namefileisnotdefined>Name '<var>file</var>' is not defined</h3>
-<p>FIXME intro
+<p>And here we go again, running <code class=filename>test.py</code> to try to execute our test cases&hellip;</p>
 <p class=skip><a href=#skipnamefileisnotdefined>skip over this</a>
 <pre class=screen><samp class=prompt>C:\home\chardet> </samp><kbd>python test.py tests\*\*</kbd>
 <samp>tests\ascii\howto.diveintomark.org.xml</samp>
@@ -661,7 +664,7 @@ NameError: name 'file' is not defined</samp></pre>
 <pre><code>for line in open(f, 'rb'):</code></pre>
 <p>And that&#8217;s all I have to say about that.
 <h3 id=cantuseastringpattern>Can&#8217;t use a string pattern on a bytes-like object</h3>
-<p>FIXME intro
+<p>Now things are starting to get interesting. And by &#8220;interesting,&#8221; I mean &#8220;confusing as all hell.&#8221;
 <p class=skip><a href=#skipcantuseastringpattern>skip over this</a>
 <pre class=screen><samp class=prompt>C:\home\chardet> </samp><kbd>python test.py tests\*\*</kbd>
 <samp>tests\ascii\howto.diveintomark.org.xml</samp>
@@ -671,8 +674,8 @@ NameError: name 'file' is not defined</samp></pre>
   File "C:\home\chardet\chardet\universaldetector.py", line 98, in feed
     if self._highBitDetector.search(aBuf):
 TypeError: can't use a string pattern on a bytes-like object</samp></pre>
-<p id=skipcantuseastringpattern>Now things are starting to get interesting. And by &#8220;interesting,&#8221; I mean &#8220;confusing as all hell.&#8221;
-<p>First, let&#8217;s see what <var>self._highBitDetector</var> is. It&#8217;s defined in the <var>__init__</var> method of the <var>UniversalDetector</var> class:
+<p id=skipcantuseastringpattern>
+<p>To debug this, let&#8217;s see what <var>self._highBitDetector</var> is. It&#8217;s defined in the <var>__init__</var> method of the <var>UniversalDetector</var> class:
 <p class=skip><a href=#skiphighbitdetectorcode>skip over this</a>
 <pre><code>class UniversalDetector:
     def __init__(self):
@@ -687,7 +690,7 @@ TypeError: can't use a string pattern on a bytes-like object</samp></pre>
     .
     if self._mInputState == ePureAscii:
         if self._highBitDetector.search(aBuf):</code></pre>
-<p id=skipfeedhighbitdetectorcode>And what is <var>aBuf</var>?  Let&#8217;s backtrack further to a place that calls <var>UniversalDetector.feed()</var>. One place that calls it is the test harness, <code class=filename>test.py</code>.
+<p id=skipfeedhighbitdetectorcode>And what is <var>aBuf</var>?  Let&#8217;s backtrack further to a place that calls <code>UniversalDetector.feed()</code>. One place that calls it is the test harness, <code class=filename>test.py</code>.
 <p class=skip><a href=#skiptestharnessfeedcode>skip over this</a>
 <pre><code>u = UniversalDetector()
 .
@@ -695,7 +698,7 @@ TypeError: can't use a string pattern on a bytes-like object</samp></pre>
 .
 for line in open(f, 'rb'):
     u.feed(line)</code></pre>
-<p id=skiptestharnessfeedcode>And here we find our answer: in the <var>UniversalDetector.feed()</var> method, <var>aBuf</var> is a line read from a file on disk. Look carefully at the parameters used to open the file: <code>'rb'</code>. <code>'r'</code> is for &#8220;read&#8221;; OK, big deal, we&#8217;re reading the file. Ah, but <code>'b'</code> is for &#8220;binary.&#8221;  Without the <code>'b'</code> flag, this <code>for</code> loop would read the file, line by line, and convert each line into a string -- an array of Unicode characters -- according to the system default character encoding. (You could override the system encoding with another parameter to <var>open()</var>, but never mind that for now.)  But with the <code>'b'</code> flag, this <code>for</code> loop reads the file, line by line, and stores each line exactly as it appears in the file, as an array of bytes. That byte array gets passed to <var>UniversalDetector.feed()</var>, and eventually gets passed to the pre-compiled regular expression, <var>self._highBitDetector</var>, to search for high-bit... characters. But we don&#8217;t have characters; we have bytes. Oops.
+<p id=skiptestharnessfeedcode>And here we find our answer: in the <code>UniversalDetector.feed()</code> method, <var>aBuf</var> is a line read from a file on disk. Look carefully at the parameters used to open the file: <code>'rb'</code>. <code>'r'</code> is for &#8220;read&#8221;; OK, big deal, we&#8217;re reading the file. Ah, but <code>'b'</code> is for &#8220;binary.&#8221;  Without the <code>'b'</code> flag, this <code>for</code> loop would read the file, line by line, and convert each line into a string -- an array of Unicode characters -- according to the system default character encoding. (You could override the system encoding with another parameter to <var>open()</var>, but never mind that for now.)  But with the <code>'b'</code> flag, this <code>for</code> loop reads the file, line by line, and stores each line exactly as it appears in the file, as an array of bytes. That byte array gets passed to <code>UniversalDetector.feed()</code>, and eventually gets passed to the pre-compiled regular expression, <var>self._highBitDetector</var>, to search for high-bit... characters. But we don&#8217;t have characters; we have bytes. Oops.
 <p>What we need this regular expression to search is not an array of characters, but an array of bytes.
 <p>Once you realize that, the solution is not difficult. Regular expressions defined with strings can search strings. Regular expressions defined with byte arrays can search byte arrays. To define a byte array pattern, we simply change the type of the argument we use to define the regular expression to a byte array. So instead of this:
 <pre><code>self._highBitDetector = re.compile(r'[\x80-\xFF]')</code></pre>
@@ -716,7 +719,202 @@ for line in open(f, 'rb'):
   File "C:\home\chardet\chardet\universaldetector.py", line 100, in feed
     elif (self._mInputState == ePureAscii) and self._escDetector.search(self._mLastChar + aBuf):
 TypeError: Can't convert 'bytes' object to str implicitly</samp></pre>
-<p id=skipcantconvertbytesobject>...
+
+<p id=skipcantconvertbytesobject>There's an unfortunate clash of coding style and Python interpreter here. The <code>TypeError</code> could be anywhere on that line, but the traceback doesn't tell you exactly where it is. It could be in the first conditional or the second, and the traceback would look the same. To narrow it down, you should split the line in half, like this:
+
+<p class=skip><a href=#skip-split-conditional>skip over this code listing</a>
+<pre><code>elif (self._mInputState == ePureAscii) and \
+    self._escDetector.search(self._mLastChar + aBuf):</code></pre>
+
+<p id=skip-split-conditional>And re-run the test:</p>
+
+<p class=skip><a href=#skip-over-cant-convert-bytes-object-2>skip over this command output listing</a>
+<pre class=screen><samp class=prompt>C:\home\chardet> </samp><kbd>python test.py tests\*\*</kbd>
+<samp>tests\ascii\howto.diveintomark.org.xml</samp>
+<samp class=traceback>Traceback (most recent call last):
+  File "test.py", line 10, in &lt;module>
+    u.feed(line)
+  File "C:\home\chardet\chardet\universaldetector.py", line 101, in feed
+    self._escDetector.search(self._mLastChar + aBuf):
+TypeError: Can't convert 'bytes' object to str implicitly</samp></pre>
+
+<p id=skip-over-cant-convert-bytes-object-2>Aha! The problem was not in the first conditional (<code>self._mInputState == ePureAscii</code>) but in the second one. So what could cause a <code>TypeError</code> there? Perhaps you're thinking that the <code>search()</code> method is expecting a value of a different type, but that wouldn't generate this traceback. Python functions can take any value; if you pass the right number of arguments, the function will execute. It may <em>crash</em> if you pass it a value of a different type than it's expecting, but if that happened, the traceback would point to somewhere inside the function. But this traceback says it never got as far as calling the <code>search()</code> method. So the problem must be in that <code>+</code> operation, as it's trying to construct the value that it will eventually pass to the <code>search()</code> method.
+
+<p>We know from <a href="#cantuseastringpattern">previous debugging</a> that <var>aBuf</var> is a byte array. So what is <code>self._mLastChar</code>? It's an instance variable, defined in the <code>reset()</code> method, which is actually called from the <code>__init__()</code> method.
+
+<p class=skip><a href=#skip-mlastchar-declaration>skip over this code listing</a>
+<pre><code>class UniversalDetector:
+    def __init__(self):
+        self._highBitDetector = re.compile(b'[\x80-\xFF]')
+        self._escDetector = re.compile(b'(\033|~{)')
+        self._mEscCharSetProber = None
+        self._mCharSetProbers = []
+<mark>        self.reset()</mark>
+
+    def reset(self):
+        self.result = {'encoding': None, 'confidence': 0.0}
+        self.done = False
+        self._mStart = True
+        self._mGotData = False
+        self._mInputState = ePureAscii
+<mark>        self._mLastChar = ''</mark></code></pre>
+
+<p id=skip-mlastchar-declaration>And now we have our answer. Do you see it? <var>self._mLastChar</var> is a string, but <var>aBuf</var> is a byte array. And you can't concatenate a string to a byte array &mdash; not even a zero-length string.
+
+<p>So what is <var>self._mLastChar</var> anyway? The answer is in the <code>feed()</code> method, just a few lines down from where the traceback occurred.
+
+<p class=skip><a href=#skip-mlastchar-set>skip over this code listing</a>
+<pre><code>if self._mInputState == ePureAscii:
+    if self._highBitDetector.search(aBuf):
+        self._mInputState = eHighbyte
+    elif (self._mInputState == ePureAscii) and \
+            self._escDetector.search(self._mLastChar + aBuf):
+        self._mInputState = eEscAscii
+
+<mark>self._mLastChar = aBuf[-1]</mark></code></pre>
+
+<p id=skip-mlastchar-set>The calling function calls this <code>feed()</code> method over and over again with a few bytes at a time. The method processes the bytes it was given (passed in as <var>aBuf</var>), then stores the last byte in <var>self._mLastChar</var> in case it's needed during the next call. (In a multi-byte encoding, the <code>feed()</code> method might get called with half of a character, then called again with the other half.)  But because <var>aBuf</var> is now a byte array instead of a string, <var>self._mLastChar</var> needs to be a byte array as well. Thus:
+
+<pre><code>  def reset(self):
+      .
+      .
+      .
+<del>-     self._mLastChar = ''</del>
+<ins>+     self._mLastChar = b''</ins></code></pre>
+
+<h3 id=unsupportedoperandtypeforplus>TypeError: unsupported operand type(s) for +: 'int' and 'bytes'</h3>
+
+<p>I have good news, and I have bad news. The good news is we're making progress&hellip;
+
+<p class=skip><a href=#skip-unsupported-operand-types>skip over this command output listing</a>
+<pre class=screen><samp class=prompt>C:\home\chardet> </samp><kbd>python test.py tests\*\*</kbd>
+<samp>tests\ascii\howto.diveintomark.org.xml</samp>
+<samp class=traceback>Traceback (most recent call last):
+  File "test.py", line 10, in &lt;module>
+    u.feed(line)
+  File "C:\home\chardet\chardet\universaldetector.py", line 101, in feed
+    self._escDetector.search(self._mLastChar + aBuf):
+TypeError: unsupported operand type(s) for +: 'int' and 'bytes'</samp></pre>
+
+<p id=skip-unsupported-operand-types>&hellip;The bad news is it doesn't always feel like progress.
+
+<p>But this is progress! Really! Even though the traceback calls out the same line of code, it's a different error than it used to be. Progress! So what's the problem now? The last time I checked, this line of code didn't try to concatenate an <code>int</code> with a byte array (<code>bytes</code>). In fact, you just spent a lot of time <a href="#cantconvertbytesobject">ensuring that <var>self._mLastChar</var> was a byte array</a>. How did it turn into an <code>int</code>?
+
+<p>The answer lies not in the previous lines of code, but in the following lines.
+
+<p class=skip><a href=#skip-mlastchar-highlight>skip over this code listing</a>
+<pre><code>if self._mInputState == ePureAscii:
+    if self._highBitDetector.search(aBuf):
+        self._mInputState = eHighbyte
+    elif (self._mInputState == ePureAscii) and \
+            self._escDetector.search(self._mLastChar + aBuf):
+        self._mInputState = eEscAscii
+
+<mark>self._mLastChar = aBuf[-1]</mark></code></pre>
+
+<p id=skip-mlastchar-highlight>This error doesn't occur the first time the <code>feed()</code> method gets called; it occurs the <em>second time</em>, after <var>self._mLastChar</var> has been set to the last byte of <var>aBuf</var>. Well, what's the problem with that? Getting a single element from a byte array yields an integer, not a byte array. To see the difference, follow me to the interactive shell:
+
+<p class=skip><a href=#skip-mlastchar-interactive>skip over this interpreter listing</a>
+<pre class=screen>
+<a><samp class=prompt>>>> </samp><kbd>aBuf = b'\xEF\xBB\xBF'</kbd>         <span>&#x2460;</span></a>
+<samp class=prompt>>>> </samp><kbd>len(aBuf)</kbd>
+<samp>3</samp>
+<samp class=prompt>>>> </samp><kbd>mLastChar = aBuf[-1]</kbd>
+<a><samp class=prompt>>>> </samp><kbd>mLastChar</kbd>                      <span>&#x2461;</span></a>
+<samp>191</samp>
+<a><samp class=prompt>>>> </samp><kbd>type(mLastChar)</kbd>                <span>&#x2462;</span></a>
+<samp>&lt;class 'int'></samp>
+<a><samp class=prompt>>>> </samp><kbd>mLastChar + aBuf</kbd>               <span>&#x2463;</span></a>
+<samp class=traceback>Traceback (most recent call last):
+  File "&lt;stdin>", line 1, in &lt;module>
+TypeError: unsupported operand type(s) for +: 'int' and 'bytes'</samp>
+<a><samp class=prompt>>>> </samp><kbd>mLastChar = aBuf[-1:]</kbd>          <span>&#x2464;</span></a>
+<samp class=prompt>>>> </samp><kbd>mLastChar</kbd>
+<samp>b'\xbf'</samp>
+<a><samp class=prompt>>>> </samp><kbd>mLastChar + aBuf</kbd>               <span>&#x2465;</span></a>
+<samp>b'\xbf\xef\xbb\xbf'</samp></pre>
+<ol id=skip-mlastchar-interactive>
+<li>Define a byte array of 3 bytes.
+<li>The last element of the byte array is 191.
+<li>That's an integer.
+<li>Concatenating an integer with a byte array doesn't work. You've now replicated the error you just found in <code>universaldetector.py</code>.
+<li>Ah, here's the fix. Instead of taking the last element of the byte array, use <a href=native-datatypes.html#slicinglists>list slicing</a> to create a new byte array containing just the last element. That is, start with the last element and continue the slice until the end of the byte array. Now <var>mLastChar</var> is a byte array of length 1.
+<li>Concatenating a byte array of length 1 with a byte array of length 3 returns a new byte array of length 4.
+</ol>
+
+<p>So, to ensure that the <code>feed()</code> method in <code>universaldetector.py</code> continues to work no matter how often it's called, you need to <a href=#cantconvertbytesobject>initialize <var>self._mLastChar</var> as a 0-length byte array</a>, then <em>make sure it stays a byte array</em>.
+
+<pre><code>              self._escDetector.search(self._mLastChar + aBuf):
+          self._mInputState = eEscAscii
+
+<del>- self._mLastChar = aBuf[-1]</del>
+<ins>+ self._mLastChar = aBuf[-1:]</ins></code></pre>
+
+<h3 id=ordexpectedstring>TypeError: ord() expected string of length 1, but int found</h3>
+
+<p>Tired yet? You're almost there&hellip;
+
+<p class=skip><a href=#skip-ord-expected-string>skip over this command output listing</a>
+<pre class=screen><samp class=prompt>C:\home\chardet> </samp><kbd>python test.py tests\*\*</kbd>
+<samp>tests\ascii\howto.diveintomark.org.xml                       ascii with confidence 1.0
+tests\Big5\0804.blogspot.com.xml</samp>
+<samp class=traceback>Traceback (most recent call last):
+  File "test.py", line 10, in &lt;module>
+    u.feed(line)
+  File "C:\home\chardet\chardet\universaldetector.py", line 116, in feed
+    if prober.feed(aBuf) == constants.eFoundIt:
+  File "C:\home\chardet\chardet\charsetgroupprober.py", line 60, in feed
+    st = prober.feed(aBuf)
+  File "C:\home\chardet\chardet\utf8prober.py", line 53, in feed
+    codingState = self._mCodingSM.next_state(c)
+  File "C:\home\chardet\chardet\codingstatemachine.py", line 43, in next_state
+    byteCls = self._mModel['classTable'][ord(c)]
+TypeError: ord() expected string of length 1, but int found</samp></pre>
+
+<p id=skip-ord-expected-string>FIXME
+
+<p class=skip><a href=#skip-next-state>skip over this code listing</a>
+<pre><code># codingstatemachine.py
+def next_state(self, c):
+    # for each byte we get its class
+    # if it is first byte, we also get byte length
+    byteCls = self._mModel['classTable'][ord(c)]</code></pre>
+
+<p id=skip-next-state>FIXME [<var>aBuf</var> is a byte array, so <var>c</var> is an <code>int</code>, not a 1-character string. IOW, there's no need to call the <code>ord()</code> function because <var>c</var> is already an <code>int</code>!]
+
+<p class=skip><a href=#skip-utf8prober-feed>skip over this code listing</a>
+<pre><code># utf8prober.py
+def feed(self, aBuf):
+    for c in aBuf:
+        codingState = self._mCodingSM.next_state(c)</code></pre>
+
+<p id=skip-utf8prober-feed>FIXME [wrapup or deleteme]
+
+<h3 id=unorderabletypes>TypeError: unorderable types: int() >= str()</h3>
+
+<p>FIXME [let's go again]
+
+<p class=skip><a href=#skip-unorderable-types-screen>skip over this command output listing</a>
+<pre class=screen><samp class=prompt>C:\home\chardet> </samp><kbd>python test.py tests\*\*</kbd>
+<samp>tests\ascii\howto.diveintomark.org.xml                       ascii with confidence 1.0
+tests\Big5\0804.blogspot.com.xml</samp>
+<samp class=traceback>Traceback (most recent call last):
+  File "test.py", line 10, in &lt;module>
+    u.feed(line)
+  File "C:\home\chardet\chardet\universaldetector.py", line 116, in feed
+    if prober.feed(aBuf) == constants.eFoundIt:
+  File "C:\home\chardet\chardet\charsetgroupprober.py", line 60, in feed
+    st = prober.feed(aBuf)
+  File "C:\home\chardet\chardet\sjisprober.py", line 68, in feed
+    self._mContextAnalyzer.feed(self._mLastChar[2 - charLen :], charLen)
+  File "C:\home\chardet\chardet\jpcntx.py", line 145, in feed
+    order, charLen = self.get_order(aBuf[i:i+2])
+  File "C:\home\chardet\chardet\jpcntx.py", line 176, in get_order
+    if ((aStr[0] >= '\x81') and (aStr[0] <= '\x9F')) or \
+TypeError: unorderable types: int() >= str()</samp></pre>
+
+<p id=skip-unorderable-types-screen>FIXME
+
 <p class=c>&copy; 2001&ndash;4, 2009 <span>&#x2133;</span>ark Pilgrim, <a href=http://creativecommons.org/licenses/by-sa/3.0/ rel=license>CC-BY-SA-3.0</a>
 <script src=jquery.js></script>
 <script src=dip3.js></script>
diff --git a/chardet/chardet/__init__.pyc b/chardet/chardet/__init__.pyc
index a991c54..d5024df 100644
Binary files a/chardet/chardet/__init__.pyc and b/chardet/chardet/__init__.pyc differ
diff --git a/chardet/chardet/big5freq.pyc b/chardet/chardet/big5freq.pyc
index 7552252..6f6a6af 100644
Binary files a/chardet/chardet/big5freq.pyc and b/chardet/chardet/big5freq.pyc differ
diff --git a/chardet/chardet/big5prober.pyc b/chardet/chardet/big5prober.pyc
index 522ab5d..5cd8f7d 100644
Binary files a/chardet/chardet/big5prober.pyc and b/chardet/chardet/big5prober.pyc differ
diff --git a/chardet/chardet/chardistribution.pyc b/chardet/chardet/chardistribution.pyc
index 4dc7697..c9ed078 100644
Binary files a/chardet/chardet/chardistribution.pyc and b/chardet/chardet/chardistribution.pyc differ
diff --git a/chardet/chardet/charsetgroupprober.pyc b/chardet/chardet/charsetgroupprober.pyc
index ed6b38f..9887ef5 100644
Binary files a/chardet/chardet/charsetgroupprober.pyc and b/chardet/chardet/charsetgroupprober.pyc differ
diff --git a/chardet/chardet/charsetprober.pyc b/chardet/chardet/charsetprober.pyc
index f1bd064..9550a50 100644
Binary files a/chardet/chardet/charsetprober.pyc and b/chardet/chardet/charsetprober.pyc differ
diff --git a/chardet/chardet/codingstatemachine.pyc b/chardet/chardet/codingstatemachine.pyc
index 9f44854..e02d8bb 100644
Binary files a/chardet/chardet/codingstatemachine.pyc and b/chardet/chardet/codingstatemachine.pyc differ
diff --git a/chardet/chardet/constants.pyc b/chardet/chardet/constants.pyc
index e7cd4fc..ae83f2c 100644
Binary files a/chardet/chardet/constants.pyc and b/chardet/chardet/constants.pyc differ
diff --git a/chardet/chardet/escprober.pyc b/chardet/chardet/escprober.pyc
index 5564ff1..fb025d0 100644
Binary files a/chardet/chardet/escprober.pyc and b/chardet/chardet/escprober.pyc differ
diff --git a/chardet/chardet/escsm.pyc b/chardet/chardet/escsm.pyc
index 1b97ea4..bc66e0b 100644
Binary files a/chardet/chardet/escsm.pyc and b/chardet/chardet/escsm.pyc differ
diff --git a/chardet/chardet/eucjpprober.pyc b/chardet/chardet/eucjpprober.pyc
index 3810fde..019edc8 100644
Binary files a/chardet/chardet/eucjpprober.pyc and b/chardet/chardet/eucjpprober.pyc differ
diff --git a/chardet/chardet/euckrfreq.pyc b/chardet/chardet/euckrfreq.pyc
index ba11667..2b7c2c4 100644
Binary files a/chardet/chardet/euckrfreq.pyc and b/chardet/chardet/euckrfreq.pyc differ
diff --git a/chardet/chardet/euckrprober.pyc b/chardet/chardet/euckrprober.pyc
index d9e33a5..ba8b4ac 100644
Binary files a/chardet/chardet/euckrprober.pyc and b/chardet/chardet/euckrprober.pyc differ
diff --git a/chardet/chardet/euctwfreq.pyc b/chardet/chardet/euctwfreq.pyc
index ee0826e..e586f56 100644
Binary files a/chardet/chardet/euctwfreq.pyc and b/chardet/chardet/euctwfreq.pyc differ
diff --git a/chardet/chardet/euctwprober.pyc b/chardet/chardet/euctwprober.pyc
index 2133083..41d576a 100644
Binary files a/chardet/chardet/euctwprober.pyc and b/chardet/chardet/euctwprober.pyc differ
diff --git a/chardet/chardet/gb2312freq.pyc b/chardet/chardet/gb2312freq.pyc
index c3e5c5a..4df57b1 100644
Binary files a/chardet/chardet/gb2312freq.pyc and b/chardet/chardet/gb2312freq.pyc differ
diff --git a/chardet/chardet/gb2312prober.pyc b/chardet/chardet/gb2312prober.pyc
index 89356b6..c200bb9 100644
Binary files a/chardet/chardet/gb2312prober.pyc and b/chardet/chardet/gb2312prober.pyc differ
diff --git a/chardet/chardet/hebrewprober.pyc b/chardet/chardet/hebrewprober.pyc
index 5546ae7..5788cf3 100644
Binary files a/chardet/chardet/hebrewprober.pyc and b/chardet/chardet/hebrewprober.pyc differ
diff --git a/chardet/chardet/jisfreq.pyc b/chardet/chardet/jisfreq.pyc
index 4259ec3..899285b 100644
Binary files a/chardet/chardet/jisfreq.pyc and b/chardet/chardet/jisfreq.pyc differ
diff --git a/chardet/chardet/jpcntx.pyc b/chardet/chardet/jpcntx.pyc
index 7adf578..455f6e8 100644
Binary files a/chardet/chardet/jpcntx.pyc and b/chardet/chardet/jpcntx.pyc differ
diff --git a/chardet/chardet/langbulgarianmodel.pyc b/chardet/chardet/langbulgarianmodel.pyc
index 5fc684c..65b8196 100644
Binary files a/chardet/chardet/langbulgarianmodel.pyc and b/chardet/chardet/langbulgarianmodel.pyc differ
diff --git a/chardet/chardet/langcyrillicmodel.pyc b/chardet/chardet/langcyrillicmodel.pyc
index 41d0a9f..ad465ee 100644
Binary files a/chardet/chardet/langcyrillicmodel.pyc and b/chardet/chardet/langcyrillicmodel.pyc differ
diff --git a/chardet/chardet/langgreekmodel.pyc b/chardet/chardet/langgreekmodel.pyc
index 55aa44b..0012470 100644
Binary files a/chardet/chardet/langgreekmodel.pyc and b/chardet/chardet/langgreekmodel.pyc differ
diff --git a/chardet/chardet/langhebrewmodel.pyc b/chardet/chardet/langhebrewmodel.pyc
index 0b9e814..369dc9e 100644
Binary files a/chardet/chardet/langhebrewmodel.pyc and b/chardet/chardet/langhebrewmodel.pyc differ
diff --git a/chardet/chardet/langhungarianmodel.pyc b/chardet/chardet/langhungarianmodel.pyc
index b2f02c1..cf25b16 100644
Binary files a/chardet/chardet/langhungarianmodel.pyc and b/chardet/chardet/langhungarianmodel.pyc differ
diff --git a/chardet/chardet/langthaimodel.pyc b/chardet/chardet/langthaimodel.pyc
index c29e8de..38b86d7 100644
Binary files a/chardet/chardet/langthaimodel.pyc and b/chardet/chardet/langthaimodel.pyc differ
diff --git a/chardet/chardet/latin1prober.pyc b/chardet/chardet/latin1prober.pyc
index 869b031..4b38eff 100644
Binary files a/chardet/chardet/latin1prober.pyc and b/chardet/chardet/latin1prober.pyc differ
diff --git a/chardet/chardet/mbcharsetprober.pyc b/chardet/chardet/mbcharsetprober.pyc
index 3b796fa..ba52fba 100644
Binary files a/chardet/chardet/mbcharsetprober.pyc and b/chardet/chardet/mbcharsetprober.pyc differ
diff --git a/chardet/chardet/mbcsgroupprober.pyc b/chardet/chardet/mbcsgroupprober.pyc
index 8eed604..5f03d2c 100644
Binary files a/chardet/chardet/mbcsgroupprober.pyc and b/chardet/chardet/mbcsgroupprober.pyc differ
diff --git a/chardet/chardet/mbcssm.pyc b/chardet/chardet/mbcssm.pyc
index 1db05cc..b04c2da 100644
Binary files a/chardet/chardet/mbcssm.pyc and b/chardet/chardet/mbcssm.pyc differ
diff --git a/chardet/chardet/sbcharsetprober.pyc b/chardet/chardet/sbcharsetprober.pyc
index c8b8672..b0bad59 100644
Binary files a/chardet/chardet/sbcharsetprober.pyc and b/chardet/chardet/sbcharsetprober.pyc differ
diff --git a/chardet/chardet/sbcsgroupprober.pyc b/chardet/chardet/sbcsgroupprober.pyc
index 857deca..6ec3e06 100644
Binary files a/chardet/chardet/sbcsgroupprober.pyc and b/chardet/chardet/sbcsgroupprober.pyc differ
diff --git a/chardet/chardet/sjisprober.pyc b/chardet/chardet/sjisprober.pyc
index 6a81164..f5b3a96 100644
Binary files a/chardet/chardet/sjisprober.pyc and b/chardet/chardet/sjisprober.pyc differ
diff --git a/chardet/chardet/universaldetector.pyc b/chardet/chardet/universaldetector.pyc
index 43c3a05..73669a3 100644
Binary files a/chardet/chardet/universaldetector.pyc and b/chardet/chardet/universaldetector.pyc differ
diff --git a/chardet/chardet/utf8prober.pyc b/chardet/chardet/utf8prober.pyc
index 9811837..9303ce9 100644
Binary files a/chardet/chardet/utf8prober.pyc and b/chardet/chardet/utf8prober.pyc differ
diff --git a/chardet/python3-conversion-notes.txt b/chardet/python3-conversion-notes.txt
index 3f7c7e7..5f74a32 100644
--- a/chardet/python3-conversion-notes.txt
+++ b/chardet/python3-conversion-notes.txt
@@ -10,11 +10,9 @@
     import sys
 * test.py: change file() to open()
 * universaldetector.py: change r'' strings to b'' byte arrays in self._highBitDetector, self._escDetector regular expressions
-- charsetprober.py: change regular expression-based replace to use b'' byte arrays instead of strings
 
-- universaldetector.py: change self._mLastChar from a r'' string to a b'' byte array
-- mbcharsetprober.py: change self._mLastChar from a list of two 1-character strings to a list of two ints
-- universaldetector.py: getting a single element from a byte array yields an integer, not a byte, so change syntax to make sure we self._mLastChar is always a byte
+* universaldetector.py: change self._mLastChar from a '' string to a b'' byte array
+* universaldetector.py: getting a single element from a byte array yields an integer, not a byte, so change syntax to make sure self._mLastChar is always a byte
   old:
     self._mLastChar = aBuf[-1]
   new:
@@ -25,4 +23,8 @@
 - jpcntx.py, chardistribution.py (editorial): global search-and-replace "aStr" --> "aBuf" to make it clear that we're passing around a byte array
 - sbcharsetprober.py, latin1prober.py: change ord(c) to c since it's already an int (iterating through a byte array)
 
+- (not sure where this fits) mbcharsetprober.py: change self._mLastChar from a list of two 1-character strings to a list of two ints
+
+- (not sure where this fits) charsetprober.py: change regular expression-based replace to use b'' byte arrays instead of strings
+
 - latin1prober.py: refactor reduce(operator.add, ...) to use a for loop instead
diff --git a/dip2 b/dip2
index 3fa4ea4..4c15027 100644
--- a/dip2
+++ b/dip2
@@ -291,14 +291,14 @@
 <p>The first thing you need to do with Python is install it. Or do you?
 <p>If you're using an account on a hosted server, your ISP may have already installed Python. Most popular Linux distributions come with Python in the default installation. Mac OS X 10.2 and later includes a command-line version of Python, although you'll probably want to install a version that includes a more Mac-like graphical interface.
 <p>Windows does not come with any version of Python, but don't despair!  There are several ways to point-and-click your way to Python on Windows.
-<p>As you can see already, Python runs on a great many operating systems. The full list includes Windows, Mac OS, Mac OS X, and all varieties of free <acronym>UNIX</acronym>-compatible systems like Linux. There are also versions that run on Sun Solaris, AS/400, Amiga, OS/2, BeOS, and a plethora
+<p>As you can see already, Python runs on a great many operating systems. The full list includes Windows, Mac OS, Mac OS X, and all varieties of free <abbr>UNIX</abbr>-compatible systems like Linux. There are also versions that run on Sun Solaris, AS/400, Amiga, OS/2, BeOS, and a plethora
 of other platforms you've probably never even heard of.
 <p>What's more, Python programs written on one platform can, with a little care, run on <em>any</em> supported platform. For instance, I regularly develop Python programs on Windows and later deploy them on Linux.
 <p>So back to the question that started this section, &#8220;Which Python is right for you?&#8221;  The answer is whichever one runs on the computer you already have.
 <h2 id="install.windows">1.2. Python on Windows</h2>
 <p>On Windows, you have a couple choices for installing Python.
-<p>ActiveState makes a Windows installer for Python called ActivePython, which includes a complete version of Python, an <acronym>IDE</acronym> with a Python-aware code editor, plus some Windows extensions for Python that allow complete access to Windows-specific services, <acronym>API</acronym>s, and the Windows Registry.
-<p>ActivePython is freely downloadable, although it is not open source. It is the <acronym>IDE</acronym> I used to learn Python, and I recommend you try it unless you have a specific reason not to. One such reason might be that ActiveState is generally
+<p>ActiveState makes a Windows installer for Python called ActivePython, which includes a complete version of Python, an <abbr>IDE</abbr> with a Python-aware code editor, plus some Windows extensions for Python that allow complete access to Windows-specific services, <abbr>API</abbr>s, and the Windows Registry.
+<p>ActivePython is freely downloadable, although it is not open source. It is the <abbr>IDE</abbr> I used to learn Python, and I recommend you try it unless you have a specific reason not to. One such reason might be that ActiveState is generally
 several months behind in updating their ActivePython installer when new version of Python are released. If you absolutely need the latest version of Python and ActivePython is still a version behind as you read this, you'll want to use the second option for installing Python on Windows.
 <p>The second option is the &#8220;official&#8221; Python installer, distributed by the people who develop Python itself. It is freely downloadable and open source, and it is always current with the latest version of Python.
 <div class=procedure>
@@ -368,7 +368,7 @@ IDLE 1.0</samp>
 </pre><h2 id="install.macosx">1.3. Python on Mac OS X</h2>
 <p>On Mac OS X, you have two choices for installing Python: install it, or don't install it. You probably want to install it.
 <p>Mac OS X 10.2 and later comes with a command-line version of Python preinstalled. If you are comfortable with the command line, you can use this version for the first third of the book. However,
-the preinstalled version does not come with an <acronym>XML</acronym> parser, so when you get to the <acronym>XML</acronym> chapter, you'll need to install the full version.
+the preinstalled version does not come with an <abbr>XML</abbr> parser, so when you get to the <abbr>XML</abbr> chapter, you'll need to install the full version.
 <p>Rather than using the preinstalled version, you'll probably want to install the latest version, which also comes with a graphical
 interactive shell.
 <div class=procedure>
@@ -426,7 +426,7 @@ Type "help", "copyright", "credits", or "license" for more information.</samp>
 <p>Double-click <code>PythonIDE</code> to launch Python.
 
 </ol>
-<p>The MacPython <acronym>IDE</acronym> should display a splash screen, then take you to the interactive shell. If the interactive shell does not appear, select
+<p>The MacPython <abbr>IDE</abbr> should display a splash screen, then take you to the interactive shell. If the interactive shell does not appear, select
 Window->Python Interactive (<kbd class=shortcut>Cmd-0</kbd>). The opening window will look something like this:
 <pre class=screen>
 <samp>Python 2.3 (#2, Jul 30 2003, 11:45:28)
@@ -475,7 +475,7 @@ Type "help", "copyright", "credits", or "license" for more information.</samp>
 <p>Double-click <code>Python IDE</code> to launch Python.
 
 </ol>
-<p>The MacPython <acronym>IDE</acronym> should display a splash screen, and then take you to the interactive shell. If the interactive shell does not appear, select
+<p>The MacPython <abbr>IDE</abbr> should display a splash screen, and then take you to the interactive shell. If the interactive shell does not appear, select
 Window->Python Interactive (<kbd class=shortcut>Cmd-0</kbd>). You'll see a screen like this:
 <pre class=screen>
 <samp>Python 2.3 (#2, Jul 30 2003, 11:45:28)
@@ -486,7 +486,7 @@ MacPython IDE 1.0.1</samp>
 </pre><h2 id="install.redhat">1.5. Python on RedHat Linux</h2>
 <p>Installing under UNIX-compatible operating systems such as Linux is easy if you're willing to install a binary package. Pre-built
 binary packages are available for most popular Linux distributions. Or you can always compile from source.
-<p>Download the latest Python <acronym>RPM</acronym> by going to <a href="http://www.python.org/ftp/python/">http://www.python.org/ftp/python/</a> and selecting the highest version number listed, then selecting the <code>rpms/</code> directory within that. Then download the <acronym>RPM</acronym> with the highest version number. You can install it with the <kbd>rpm</kbd> command, as shown here:
+<p>Download the latest Python <abbr>RPM</abbr> by going to <a href="http://www.python.org/ftp/python/">http://www.python.org/ftp/python/</a> and selecting the highest version number listed, then selecting the <code>rpms/</code> directory within that. Then download the <abbr>RPM</abbr> with the highest version number. You can install it with the <kbd>rpm</kbd> command, as shown here:
 <div class=example><h3>Example 1.2. Installing on RedHat Linux 9</h3><pre class=screen>
 <samp class=prompt>localhost:~$ </samp>su -
 <samp class=prompt>Password: </samp>[enter your root password]
@@ -516,9 +516,9 @@ Type "help", "copyright", "credits", or "license" for more information.</samp>
 <li>Whoops!  Just typing <kbd>python</kbd> gives you the older version of Python -- the one that was installed by default. That's not the one you want.
 <li>At the time of this writing, the newest version is called <kbd>python2.3</kbd>. You'll probably want to change the path on the first line of the sample scripts to point to the newer version.
 <li>This is the complete path of the newer version of Python that you just installed. Use this on the <code>#!</code> line (the first line of each script) to ensure that scripts are running under the latest version of Python, and be sure to type <kbd>python2.3</kbd> to get into the interactive shell.
-<h2 id="install.debian">1.6. Python on Debian <acronym>GNU</acronym>/Linux</h2>
-<p>If you are lucky enough to be running Debian <acronym>GNU</acronym>/Linux, you install Python through the <kbd>apt</kbd> command.
-<div class=example><h3>Example 1.3. Installing on Debian <acronym>GNU</acronym>/Linux</h3><pre class=screen>
+<h2 id="install.debian">1.6. Python on Debian <abbr>GNU</abbr>/Linux</h2>
+<p>If you are lucky enough to be running Debian <abbr>GNU</abbr>/Linux, you install Python through the <kbd>apt</kbd> command.
+<div class=example><h3>Example 1.3. Installing on Debian <abbr>GNU</abbr>/Linux</h3><pre class=screen>
 <samp class=prompt>localhost:~$ </samp>su -
 <samp class=prompt>Password: </samp>[enter your root password]
 <samp class=prompt>localhost:~# </samp>apt-get install python
@@ -640,16 +640,16 @@ if __name__ == "__main__":
     print buildConnectionString(myParams)</pre><p>Now run this program and see what happens.
 <table id="tip.run.windows" class=tip border="0" summary="">
 
-<td rowspan="2" align="center" valign="top" width="1%"><img src="images/tip.png" alt="Tip" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">In the ActivePython <acronym>IDE</acronym> on Windows, you can run the Python program you're editing by choosing
+<td rowspan="2" align="center" valign="top" width="1%"><img src="images/tip.png" alt="Tip" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">In the ActivePython <abbr>IDE</abbr> on Windows, you can run the Python program you're editing by choosing
 File->Run... (<kbd class=shortcut>Ctrl-R</kbd>). Output is displayed in the interactive window.
 <table id="tip.run.mac" class=tip border="0" summary="">
 
-<td rowspan="2" align="center" valign="top" width="1%"><img src="images/tip.png" alt="Tip" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">In the Python <acronym>IDE</acronym> on Mac OS, you can run a Python program with
-Python->Run window... (<kbd class=shortcut>Cmd-R</kbd>), but there is an important option you must set first. Open the <code>.py</code> file in the <acronym>IDE</acronym>, pop up the options menu by clicking the black triangle in the upper-right corner of the window, and make sure the Run as __main__ option is checked. This is a per-file setting, but you'll only need to do it once per file.
+<td rowspan="2" align="center" valign="top" width="1%"><img src="images/tip.png" alt="Tip" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">In the Python <abbr>IDE</abbr> on Mac OS, you can run a Python program with
+Python->Run window... (<kbd class=shortcut>Cmd-R</kbd>), but there is an important option you must set first. Open the <code>.py</code> file in the <abbr>IDE</abbr>, pop up the options menu by clicking the black triangle in the upper-right corner of the window, and make sure the Run as __main__ option is checked. This is a per-file setting, but you'll only need to do it once per file.
 <table id="tip.run.unix" class=tip border="0" summary="">
 
-<td rowspan="2" align="center" valign="top" width="1%"><img src="images/tip.png" alt="Tip" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">On <acronym>UNIX</acronym>-compatible systems (including Mac OS X), you can run a Python program from the command line: <kbd>python <code>odbchelper.py</code></kbd><p>The id="odbchelper.output" output of <code>odbchelper.py</code> will look like this:<pre class=screen>server=mpilgrim;uid=sa;database=master;pwd=secret</pre><h2 id="odbchelper.funcdef">2.2. Declaring Functions</h2>
-<p>Python has functions like most other languages, but it does not have separate header files like <acronym>C++</acronym> or <code>interface</code>/<code>implementation</code> sections like Pascal. When you need a function, just declare it, like this:
+<td rowspan="2" align="center" valign="top" width="1%"><img src="images/tip.png" alt="Tip" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">On <abbr>UNIX</abbr>-compatible systems (including Mac OS X), you can run a Python program from the command line: <kbd>python <code>odbchelper.py</code></kbd><p id="odbchelper.output">The output of <code>odbchelper.py</code> will look like this:<pre class=screen>server=mpilgrim;uid=sa;database=master;pwd=secret</pre><h2 id="odbchelper.funcdef">2.2. Declaring Functions</h2>
+<p>Python has functions like most other languages, but it does not have separate header files like <abbr>C++</abbr> or <code>interface</code>/<code>implementation</code> sections like Pascal. When you need a function, just declare it, like this:
 <pre><code>
 def buildConnectionString(params):</pre><p>Note that the keyword <code>def</code> starts the function declaration, followed by the function name, followed by the arguments in parentheses. Multiple arguments
 (not shown here) are separated with commas.
@@ -661,7 +661,7 @@ In fact, every Python function returns a value; if the function ever executes a
 <p>The argument, <code>params</code>, doesn't specify a datatype. In Python, variables are never explicitly typed. Python figures out what type a variable is and keeps track of it internally.
 <table id="compare.funcdef.java" class=note border="0" summary="">
 
-<td rowspan="2" align="center" valign="top" width="1%"><img src="images/note.png" alt="Note" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">In Java, <acronym>C++</acronym>, and other statically-typed languages, you must specify the datatype of the function return value and each function argument.
+<td rowspan="2" align="center" valign="top" width="1%"><img src="images/note.png" alt="Note" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">In Java, <abbr>C++</abbr>, and other statically-typed languages, you must specify the datatype of the function return value and each function argument.
        In Python, you never explicitly specify the datatype of anything. Based on what value you assign, Python keeps track of the datatype internally.
 <h3>2.2.1. How Python's Datatypes Compare to Other Programming Languages</h3>
 <p>An erudite reader sent me this explanation of how Python compares to other programming languages:
@@ -669,7 +669,7 @@ In fact, every Python function returns a value; if the function ever executes a
 <dl>
 <dt>statically typed language</dt>
 <dd>A language in which types are fixed at compile time. Most statically typed languages enforce this by requiring you to declare
-         all variables with their datatypes before using them. Java and <acronym>C</acronym> are statically typed languages.
+         all variables with their datatypes before using them. Java and <abbr>C</abbr> are statically typed languages.
 </dd>
 <dt>dynamically typed language</dt>
 <dd>A language in which types are discovered at execution time; the opposite of statically typed. VBScript and Python are dynamically typed, because they figure out what type a variable is when you first assign it a value.
@@ -698,7 +698,7 @@ def buildConnectionString(params):
 need to give your function a <code>docstring</code>, but you always should. I know you've heard this in every programming class you've ever taken, but Python gives you an added incentive: the <code>docstring</code> is available at runtime as an attribute of the function.
 <table id="tip.docstring" class=note border="0" summary="">
 
-<td rowspan="2" align="center" valign="top" width="1%"><img src="images/note.png" alt="Note" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">Many Python <acronym>IDE</acronym>s use the <code>docstring</code> to provide context-sensitive documentation, so that when you type a function name, its <code>docstring</code> appears as a tooltip. This can be incredibly helpful, but it's only as good as the <code>docstring</code>s you write.
+<td rowspan="2" align="center" valign="top" width="1%"><img src="images/note.png" alt="Note" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">Many Python <abbr>IDE</abbr>s use the <code>docstring</code> to provide context-sensitive documentation, so that when you type a function name, its <code>docstring</code> appears as a tooltip. This can be incredibly helpful, but it's only as good as the <code>docstring</code>s you write.
 
 
 
@@ -712,7 +712,7 @@ need to give your function a <code>docstring</code>, but you always should. I kn
 if __name__ == "__main__":</pre><p>Some quick observations before you get to the good stuff. First, parentheses are not required around the <code>if</code> expression. Second, the <code>if</code> statement ends with a colon, and is followed by <a href="#odbchelper.indenting" title="2.5. Indenting Code">indented code</a>.
 <table id="compare.equals.c" class=note border="0" summary="">
 
-<td rowspan="2" align="center" valign="top" width="1%"><img src="images/note.png" alt="Note" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">Like <acronym>C</acronym>, Python uses <code>==</code> for comparison and <code>=</code> for assignment. Unlike <acronym>C</acronym>, Python does not support in-line assignment, so there's no chance of accidentally assigning the value you thought you were comparing.
+<td rowspan="2" align="center" valign="top" width="1%"><img src="images/note.png" alt="Note" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">Like <abbr>C</abbr>, Python uses <code>==</code> for comparison and <code>=</code> for assignment. Unlike <abbr>C</abbr>, Python does not support in-line assignment, so there's no chance of accidentally assigning the value you thought you were comparing.
 <p>So why is this particular <code>if</code> statement a trick?  Modules are objects, and all modules have a built-in attribute <code>__name__</code>. A module's <code>__name__</code> depends on how you're using the module. If you <code>import</code> the module, then <code>__name__</code> is the module's filename, without a directory path or file extension. But you can also run the module directly as a standalone
 program, in which case <code>__name__</code> will be a special default value, <code>__main__</code>.
 <pre class=screen><samp class=prompt>>>> </samp><kbd>import odbchelper</kbd>
@@ -746,7 +746,7 @@ if __name__ == "__main__":
 <p>Also notice that the variable assignment is one command split over several lines, with a backslash (&#8220;<code>\</code>&#8221;) serving as a line-continuation marker.
 <table id="tip.multiline" class=note border="0" summary="">
 
-<td rowspan="2" align="center" valign="top" width="1%"><img src="images/note.png" alt="Note" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">When a command is split among several lines with the line-continuation marker (&#8220;<code>\</code>&#8221;), the continued lines can be indented in any manner; Python's normally stringent indentation rules do not apply. If your Python <acronym>IDE</acronym> auto-indents the continued line, you should probably accept its default unless you have a burning reason not to.
+<td rowspan="2" align="center" valign="top" width="1%"><img src="images/note.png" alt="Note" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">When a command is split among several lines with the line-continuation marker (&#8220;<code>\</code>&#8221;), the continued lines can be indented in any manner; Python's normally stringent indentation rules do not apply. If your Python <abbr>IDE</abbr> auto-indents the continued line, you should probably accept its default unless you have a burning reason not to.
 <p><a name="tip.implicitmultiline"></a>Strictly speaking, expressions in parentheses, straight brackets, or curly braces (like <a href="#myparamsdef" title="Example 3.17. Defining the myParams Variable">defining a dictionary</a>) can be split into multiple lines with or without the line continuation character (&#8220;<code>\</code>&#8221;). I like to include the backslash even when it's not required because I think it makes the code easier to read, but that's
 a matter of style.
 <p>Third, you never declared the variable <var>myParams</var>, you just assigned a value to it. This is like VBScript without the <code>option explicit</code> option. Luckily, unlike VBScript, Python will not allow you to reference a variable that has never been assigned a value; trying to do so will raise an exception.
@@ -770,7 +770,7 @@ NameError: There is no variable named 'x'</samp>
 'e'</pre><div class=calloutlist>
 <ol>
 <li><var>v</var> is a tuple of three elements, and <code>(x, y, z)</code> is a tuple of three variables. Assigning one to the other assigns each of the values of <var>v</var> to each of the variables, in order.
-<p>This has all sorts of uses. I often want to assign names to a range of values. In <acronym>C</acronym>, you would use <code>enum</code> and manually list each constant and its associated value, which seems especially tedious when the values are consecutive.
+<p>This has all sorts of uses. I often want to assign names to a range of values. In <abbr>C</abbr>, you would use <code>enum</code> and manually list each constant and its associated value, which seems especially tedious when the values are consecutive.
    In Python, you can use the built-in <code>range</code> function with multi-variable assignment to quickly assign consecutive values.
 <div class=example><h3 id="odbchelper.multiassign.range">Example 3.20. Assigning Consecutive Values</h3><pre class=screen><samp class=prompt>>>> </samp><kbd>range(7)</kbd>              <span>&#x2460;</span>
 [0, 1, 2, 3, 4, 5, 6]
@@ -784,7 +784,7 @@ NameError: There is no variable named 'x'</samp>
 <ol>
 <li>The built-in <code>range</code> function returns a list of integers. In its simplest form, it takes an upper limit and returns a zero-based list counting
                up to but not including the upper limit. (If you like, you can pass other parameters to specify a base other than <code>0</code> and a step other than <code>1</code>. You can <code>print range.__doc__</code> for details.)
-<li><var>MONDAY</var>, <var>TUESDAY</var>, <var>WEDNESDAY</var>, <var>THURSDAY</var>, <var>FRIDAY</var>, <var>SATURDAY</var>, and <var>SUNDAY</var> are the variables you're defining. (This example came from the <code>calendar</code> module, a fun little module that prints calendars, like the <acronym>UNIX</acronym> program <code>cal</code>. The <code>calendar</code> module defines integer constants for days of the week.)
+<li><var>MONDAY</var>, <var>TUESDAY</var>, <var>WEDNESDAY</var>, <var>THURSDAY</var>, <var>FRIDAY</var>, <var>SATURDAY</var>, and <var>SUNDAY</var> are the variables you're defining. (This example came from the <code>calendar</code> module, a fun little module that prints calendars, like the <abbr>UNIX</abbr> program <code>cal</code>. The <code>calendar</code> module defines integer constants for days of the week.)
 <li>Now each variable has its value: <var>MONDAY</var> is <code>0</code>, <var>TUESDAY</var> is <code>1</code>, and so forth.
 <p>You can also use multi-variable assignment to build functions that return multiple values, simply by returning a tuple of
    all the values. The caller can treat it as a tuple, or assign the values to individual variables. Many standard Python libraries do this, including the <code>os</code> module, which you'll discuss in <a href="#filehandling">Chapter 6</a>.
@@ -801,7 +801,7 @@ NameError: There is no variable named 'x'</samp>
    to insert values into a string with the <code>%s</code> placeholder.
 <table id="compare.stringformatting.c" class=note border="0" summary="">
 
-<td rowspan="2" align="center" valign="top" width="1%"><img src="images/note.png" alt="Note" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">String formatting in Python uses the same syntax as the <code>sprintf</code> function in <acronym>C</acronym>.
+<td rowspan="2" align="center" valign="top" width="1%"><img src="images/note.png" alt="Note" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">String formatting in Python uses the same syntax as the <code>sprintf</code> function in <abbr>C</abbr>.
 <div class=example><h3>Example 3.21. Introducing String Formatting</h3><pre class=screen><samp class=prompt>>>> </samp><kbd>k = "uid"</kbd>
 <samp class=prompt>>>> </samp><kbd>v = "sa"</kbd>
 <samp class=prompt>>>> </samp><kbd>"%s=%s" % (k, v)</kbd> <span>&#x2460;</span>
@@ -833,7 +833,7 @@ TypeError: cannot concatenate 'str' and 'int' objects</span></pre><div class=cal
 <li>String formatting works with integers by specifying <code>%d</code> instead of <code>%s</code>.
 <li>Trying to concatenate a string with a non-string raises an exception. Unlike string formatting, string concatenation works
             only when everything is already a string.
-<p>As with <code>printf</code> in <acronym>C</acronym>, string formatting in Python is like a Swiss Army knife. There are options galore, and modifier strings to specially format many different types of values.
+<p>As with <code>printf</code> in <abbr>C</abbr>, string formatting in Python is like a Swiss Army knife. There are options galore, and modifier strings to specially format many different types of values.
 <div class=example><h3 id="odbchelper.stringformatting.numbers">Example 3.23. Formatting Numbers</h3><pre class=screen>
 <samp class=prompt>>>> </samp><kbd>print "Today's stock price: %f" % 50.4625</kbd>   <span>&#x2460;</span>
 50.462500
@@ -852,7 +852,7 @@ TypeError: cannot concatenate 'str' and 'int' objects</span></pre><div class=cal
 <ul>
 <li><a href="http://www.python.org/doc/current/lib/"><i class=citetitle>Python Library Reference</i></a> summarizes <a href="http://www.python.org/doc/current/lib/typesseq-strings.html">all the string formatting format characters</a>.
 
-<li><a href="http://www-gnats.gnu.org:8080/cgi-bin/info2www?(gawk)Top"><i class=citetitle>Effective <acronym>AWK</acronym> Programming</i></a> discusses <a href="http://www-gnats.gnu.org:8080/cgi-bin/info2www?(gawk)Control+Letters">all the format characters</a> and advanced string formatting techniques like <a href="http://www-gnats.gnu.org:8080/cgi-bin/info2www?(gawk)Format+Modifiers">specifying width, precision, and zero-padding</a>.
+<li><a href="http://www-gnats.gnu.org:8080/cgi-bin/info2www?(gawk)Top"><i class=citetitle>Effective <abbr>AWK</abbr> Programming</i></a> discusses <a href="http://www-gnats.gnu.org:8080/cgi-bin/info2www?(gawk)Control+Letters">all the format characters</a> and advanced string formatting techniques like <a href="http://www-gnats.gnu.org:8080/cgi-bin/info2www?(gawk)Format+Modifiers">specifying width, precision, and zero-padding</a>.
 
 </ul>
 <h2 id="odbchelper.map">3.6. Mapping Lists</h2>
@@ -953,7 +953,7 @@ called <code>split</code>.
 
 <li><a href="http://www.python.org/doc/current/lib/"><i class=citetitle>Python Library Reference</i></a> documents the <a href="http://www.python.org/doc/current/lib/module-string.html"><code>string</code> module</a>.
 
-<li><a href="http://www.python.org/doc/FAQ.html"><i class=citetitle>The Whole Python <acronym>FAQ</acronym></i></a> explains <a href="http://www.python.org/cgi-bin/faqw.py?query=4.96&amp;querytype=simple&amp;casefold=yes&amp;req=search">why <code>join</code> is a string method</a> instead of a list method.
+<li><a href="http://www.python.org/doc/FAQ.html"><i class=citetitle>The Whole Python <abbr>FAQ</abbr></i></a> explains <a href="http://www.python.org/cgi-bin/faqw.py?query=4.96&amp;querytype=simple&amp;casefold=yes&amp;req=search">why <code>join</code> is a string method</a> instead of a list method.
 
 </ul>
 <h3>3.7.1. Historical Note on String Methods</h3>
@@ -981,9 +981,9 @@ if __name__ == "__main__":
 <p>Before diving into the next chapter, make sure you're comfortable doing all of these things:
 <div class=itemizedlist>
 <ul>
-<li>Using the Python <acronym>IDE</acronym> to test expressions interactively
+<li>Using the Python <abbr>IDE</abbr> to test expressions interactively
 
-<li>Writing Python programs and <a href="#odbchelper.testing" title="2.6. Testing Modules">running them from within your <acronym>IDE</acronym></a>, or from the command line
+<li>Writing Python programs and <a href="#odbchelper.testing" title="2.6. Testing Modules">running them from within your <abbr>IDE</abbr></a>, or from the command line
 
 <li><a href="#odbchelper.import" title="Example 2.3. Accessing the buildConnectionString Function's docstring">Importing modules</a> and calling their functions
 
@@ -1029,7 +1029,7 @@ if __name__ == "__main__":                <span>&#x2463;</span> <span>&#x2464;</
 <li>The <code>if __name__</code> <a href="#odbchelper.ifnametrick">trick</a> allows this program do something useful when run by itself, without interfering with its use as a module for other programs.
              In this case, the program simply prints out the <code>docstring</code> of the <code>info</code> function.
 <li><a href="#odbchelper.ifnametrick"><code>if</code> statements</a> use <code>==</code> for comparison, and parentheses are not required.
-<p>The <code>info</code> function is designed to be used by you, the programmer, while working in the Python <acronym>IDE</acronym>. It takes any object that has functions or methods (like a module, which has functions, or a list, which has methods) and
+<p>The <code>info</code> function is designed to be used by you, the programmer, while working in the Python <abbr>IDE</abbr>. It takes any object that has functions or methods (like a module, which has functions, or a list, which has methods) and
 prints out the functions and their <code>docstring</code>s.
 <div class=example><h3>Example 4.2. Sample Usage of <code>apihelper.py</code></h3><pre class=screen><samp class=prompt>>>> </samp><kbd>from apihelper import info</kbd>
 <samp class=prompt>>>> </samp><kbd>li = []</kbd>
@@ -1054,7 +1054,7 @@ buildConnectionString          Build a connection string from a dictionary Retur
     Returns string.
 </span></pre><h2 id="apihelper.optional">4.2. Using Optional and Named Arguments</h2>
 <p>Python allows function arguments to have default values; if the function is called without the argument, the argument gets its default
-   value. Futhermore, arguments can be specified in any order by using named arguments. Stored procedures in SQL Server Transact/<acronym>SQL</acronym> can do this, so if you're a SQL Server scripting guru, you can skim this part.
+   value. Furthermore, arguments can be specified in any order by using named arguments. Stored procedures in SQL Server Transact/<abbr>SQL</abbr> can do this, so if you're a SQL Server scripting guru, you can skim this part.
 
 <p>Here is an example of <code>info</code>, a function with two optional arguments:<pre><code>
 def info(object, spacing=10, collapse=1):</pre><p><var>spacing</var> and <var>collapse</var> are optional, because they have default values defined. <var>object</var> is required, because it has no default value. If <code>info</code> is called with only one argument, <var>spacing</var> defaults to <code>10</code> and <var>collapse</var> defaults to <code>1</code>. If <code>info</code> is called with two arguments, <var>collapse</var> still defaults to <code>1</code>.
@@ -1247,7 +1247,7 @@ True</pre><div class=calloutlist>
 <h3>4.4.2. <code>getattr</code> As a Dispatcher</h3>
 <p>A common usage pattern of <code>getattr</code> is as a dispatcher. For example, if you had a program that could output data in a variety of different formats, you could
    define separate functions for each output format and use a single dispatch function to call the right one.
-<p>For example, let's imagine a program that prints site statistics in <acronym>HTML</acronym>, <acronym>XML</acronym>, and plain text formats. The choice of output format could be specified on the command line, or stored in a configuration
+<p>For example, let's imagine a program that prints site statistics in <abbr>HTML</abbr>, <abbr>XML</abbr>, and plain text formats. The choice of output format could be specified on the command line, or stored in a configuration
    file. A <code>statsout</code> module defines three functions, <code>output_html</code>, <code>output_xml</code>, and <code>output_text</code>. Then the main program defines a single output function, like this:
 <div class=example><h3 id="apihelper.getattr.dispatch">Example 4.12. Creating a Dispatcher with <code>getattr</code></h3><pre><code>
 import statsout
@@ -1345,7 +1345,7 @@ the <code>pop</code> method of a list) and user-defined (like the <code>buildCon
 <li>If all values are false, <code>or</code> returns the last value. <code>or</code> evaluates <code>''</code>, which is false, then <code>[]</code>, which is false, then <code>{}</code>, which is false, and returns <code>{}</code>.
 <li>Note that <code>or</code> evaluates values only until it finds one that is true in a boolean context, and then it ignores the rest. This distinction
             is important if some values can have side effects. Here, the function <code>sidefx</code> is never called, because <code>or</code> evaluates <code>'a'</code>, which is true, and returns <code>'a'</code> immediately.
-<p>If you're a <acronym>C</acronym> hacker, you are certainly familiar with the <code><var>bool</var> ? <var>a</var> : <var>b</var></code> expression, which evaluates to <var>a</var> if <var><code>bool</code></var> is true, and <var>b</var> otherwise. Because of the way <code>and</code> and <code>or</code> work in Python, you can accomplish the same thing.
+<p>If you're a <abbr>C</abbr> hacker, you are certainly familiar with the <code><var>bool</var> ? <var>a</var> : <var>b</var></code> expression, which evaluates to <var>a</var> if <var><code>bool</code></var> is true, and <var>b</var> otherwise. Because of the way <code>and</code> and <code>or</code> work in Python, you can accomplish the same thing.
 <h3>4.6.1. Using the <code>and-or</code> Trick</h3>
 <div class=example><h3 id="apihelper.andortrick.intro">Example 4.17. Introducing the <code>and-or</code> Trick</h3><pre class=screen><samp class=prompt>>>> </samp><kbd>a = "first"</kbd>
 <samp class=prompt>>>> </samp><kbd>b = "second"</kbd>
@@ -1355,17 +1355,17 @@ the <code>pop</code> method of a list) and user-defined (like the <code>buildCon
 'second'
 </pre><div class=calloutlist>
 <ol>
-<li>This syntax looks similar to the <code><var>bool</var> ? <var>a</var> : <var>b</var></code> expression in <acronym>C</acronym>. The entire expression is evaluated from left to right, so the <code>and</code> is evaluated first. <code>1 and 'first'</code> evalutes to <code>'first'</code>, then <code>'first' or 'second'</code> evalutes to <code>'first'</code>.
+<li>This syntax looks similar to the <code><var>bool</var> ? <var>a</var> : <var>b</var></code> expression in <abbr>C</abbr>. The entire expression is evaluated from left to right, so the <code>and</code> is evaluated first. <code>1 and 'first'</code> evaluates to <code>'first'</code>, then <code>'first' or 'second'</code> evaluates to <code>'first'</code>.
 <li><code>0 and 'first'</code> evalutes to <code>False</code>, and then <code>0 or 'second'</code> evaluates to <code>'second'</code>.
 <p>However, since this Python expression is simply boolean logic, and not a special construct of the language, there is one extremely important difference
-   between this <code>and-or</code> trick in Python and the <code><var>bool</var> ? <var>a</var> : <var>b</var></code> syntax in <acronym>C</acronym>. If the value of <var>a</var> is false, the expression will not work as you would expect it to. (Can you tell I was bitten by this?  More than once?)
+   between this <code>and-or</code> trick in Python and the <code><var>bool</var> ? <var>a</var> : <var>b</var></code> syntax in <abbr>C</abbr>. If the value of <var>a</var> is false, the expression will not work as you would expect it to. (Can you tell I was bitten by this?  More than once?)
 <div class=example><h3>Example 4.18. When the <code>and-or</code> Trick Fails</h3><pre class=screen><samp class=prompt>>>> </samp><kbd>a = ""</kbd>
 <samp class=prompt>>>> </samp><kbd>b = "second"</kbd>
 <samp class=prompt>>>> </samp><kbd>1 and a or b</kbd>         <span>&#x2460;</span>
 'second'</pre><div class=calloutlist>
 <ol>
 <li>Since <var>a</var> is an empty string, which Python considers false in a boolean context, <code>1 and ''</code> evalutes to <code>''</code>, and then <code>'' or 'second'</code> evalutes to <code>'second'</code>. Oops!  That's not what you wanted.
-<p>The <code>and-or</code> trick, <code><var>bool</var> and <var>a</var> or <var>b</var></code>, will not work like the <acronym>C</acronym> expression <code><var>bool</var> ? <var>a</var> : <var>b</var></code> when <var>a</var> is false in a boolean context.
+<p>The <code>and-or</code> trick, <code><var>bool</var> and <var>a</var> or <var>b</var></code>, will not work like the <abbr>C</abbr> expression <code><var>bool</var> ? <var>a</var> : <var>b</var></code> when <var>a</var> is false in a boolean context.
 <p>The real trick behind the <code>and-or</code> trick, then, is to make sure that the value of <var>a</var> is never false. One common way of doing this is to turn <var>a</var> into <code>[<var>a</var>]</code> and <var>b</var> into <code>[<var>b</var>]</code>, then taking the first element of the returned list, which will be either <var>a</var> or <var>b</var>.
 <div class=example><h3>Example 4.19. Using the <code>and-or</code> Trick Safely</h3><pre class=screen><samp class=prompt>>>> </samp><kbd>a = ""</kbd>
 <samp class=prompt>>>> </samp><kbd>b = "second"</kbd>
@@ -1436,9 +1436,9 @@ a	test</samp>
 <ul>
 <li><a href="http://www.faqts.com/knowledge-base/index.phtml/fid/199/">Python Knowledge Base</a> discusses using <code>lambda</code> to <a href="http://www.faqts.com/knowledge-base/view.phtml/aid/6081/fid/241">call functions indirectly</a>.
 
-<li><a href="http://www.python.org/doc/current/tut/tut.html"><i class=citetitle>Python Tutorial</i></a> shows how to <a href="http://www.python.org/doc/current/tut/node6.html#SECTION006740000000000000000">access outside variables from inside a <code>lambda</code> function</a>. (<a href="http://python.sourceforge.net/peps/pep-0227.html"><acronym>PEP</acronym> 227</a> explains how this will change in future versions of Python.)
+<li><a href="http://www.python.org/doc/current/tut/tut.html"><i class=citetitle>Python Tutorial</i></a> shows how to <a href="http://www.python.org/doc/current/tut/node6.html#SECTION006740000000000000000">access outside variables from inside a <code>lambda</code> function</a>. (<a href="http://python.sourceforge.net/peps/pep-0227.html"><abbr>PEP</abbr> 227</a> explains how this will change in future versions of Python.)
 
-<li><a href="http://www.python.org/doc/FAQ.html"><i class=citetitle>The Whole Python <acronym>FAQ</acronym></i></a> has examples of <a href="http://www.python.org/cgi-bin/faqw.py?query=4.15&amp;querytype=simple&amp;casefold=yes&amp;req=search">obfuscated one-liners using <code>lambda</code></a>.
+<li><a href="http://www.python.org/doc/FAQ.html"><i class=citetitle>The Whole Python <abbr>FAQ</abbr></i></a> has examples of <a href="http://www.python.org/cgi-bin/faqw.py?query=4.15&amp;querytype=simple&amp;casefold=yes&amp;req=search">obfuscated one-liners using <code>lambda</code></a>.
 
 </ul>
 <h2 id="apihelper.alltogether">4.8. Putting It All Together</h2>
@@ -1479,12 +1479,12 @@ True
 'None'
 </pre><div class=calloutlist>
 <ol>
-<li>You can easily define a function that has no <code>docstring</code>, so its <code>__doc__</code> attribute is <code>None</code>. Confusingly, if you evaluate the <code>__doc__</code> attribute directly, the Python <acronym>IDE</acronym> prints nothing at all, which makes sense if you think about it, but is still unhelpful.
+<li>You can easily define a function that has no <code>docstring</code>, so its <code>__doc__</code> attribute is <code>None</code>. Confusingly, if you evaluate the <code>__doc__</code> attribute directly, the Python <abbr>IDE</abbr> prints nothing at all, which makes sense if you think about it, but is still unhelpful.
 <li>You can verify that the value of the <code>__doc__</code> attribute is actually <code>None</code> by comparing it directly.
 <li>The <code>str</code> function takes the null value and returns a string representation of it, <code>'None'</code>.
 <table id="compare.isnull.sql" class=note border="0" summary="">
 
-<td rowspan="2" align="center" valign="top" width="1%"><img src="images/note.png" alt="Note" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">In <acronym>SQL</acronym>, you must use <code>IS NULL</code> instead of <code>= NULL</code> to compare a null value. In Python, you can use either <code>== None</code> or <code>is None</code>, but <code>is None</code> is faster.
+<td rowspan="2" align="center" valign="top" width="1%"><img src="images/note.png" alt="Note" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">In <abbr>SQL</abbr>, you must use <code>IS NULL</code> instead of <code>= NULL</code> to compare a null value. In Python, you can use either <code>== None</code> or <code>is None</code>, but <code>is None</code> is faster.
 <p>Now that you are guaranteed to have a string, you can pass the string to <var>processFunc</var>, which you have <a href="#apihelper.lambda" title="4.7. Using lambda Functions">already defined</a> as a function that either does or doesn't collapse whitespace. Now you see why it was important to use <code>str</code> to convert a <code>None</code> value into a string representation. <var>processFunc</var> is assuming a string argument and calling its <code>split</code> method, which would crash if you passed it <code>None</code> because <code>None</code> doesn't have a <code>split</code> method.
 <p>Stepping back even further, you see that you're using string formatting again to concatenate the return value of <var>processFunc</var> with the return value of <var>method</var>'s <code>ljust</code> method. This is a new string method that you haven't seen before.
 <div class=example><h3>Example 4.24. Introducing <code>ljust</code></h3><pre class=screen><samp class=prompt>>>> </samp><kbd>s = 'buildConnectionString'</kbd>
@@ -1703,7 +1703,7 @@ can import individual items or use <code>from <var>module</var> import *</code>
 <table id="compare.fromimport.java" class=note border="0" summary="">
 
 <td rowspan="2" align="center" valign="top" width="1%"><img src="images/note.png" alt="Note" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%"><code>from <var>module</var> import *</code> in Python is like <code>import <var>module</var>.*</code> in Java; <code>import <var>module</var></code> in Python is like <code>import <var>module</var></code> in Java.
-<div class=example><h3>Example 5.2. <code>import <var>module</var></code> <i class=foreignphrase><acronym>vs.</acronym></i> <code>from <var>module</var> import</code></h3><pre class=screen><samp class=prompt>>>> </samp><kbd>import types</kbd>
+<div class=example><h3>Example 5.2. <code>import <var>module</var></code> <i class=foreignphrase><abbr>vs.</abbr></i> <code>from <var>module</var> import</code></h3><pre class=screen><samp class=prompt>>>> </samp><kbd>import types</kbd>
 <samp class=prompt>>>> </samp><kbd>types.FunctionType</kbd>             <span>&#x2460;</span>
 &lt;type 'function'>
 <samp class=prompt>>>> </samp><kbd>FunctionType</kbd> <span>&#x2461;</span>
@@ -1736,7 +1736,7 @@ NameError: There is no variable named 'FunctionType'</samp>
 <div class=itemizedlist>
 <h3>Further Reading on Module Importing Techniques</h3>
 <ul>
-<li><a href="http://www.effbot.org/guides/">eff-bot</a> has more to say on <a href="http://www.effbot.org/guides/import-confusion.htm"><code>import <var>module</var></code> <i class=foreignphrase><acronym>vs.</acronym></i> <code>from <var>module</var> import</code></a>.
+<li><a href="http://www.effbot.org/guides/">eff-bot</a> has more to say on <a href="http://www.effbot.org/guides/import-confusion.htm"><code>import <var>module</var></code> <i class=foreignphrase><abbr>vs.</abbr></i> <code>from <var>module</var> import</code></a>.
 
 <li><a href="http://www.python.org/doc/current/tut/tut.html"><i class=citetitle>Python Tutorial</i></a> discusses advanced import techniques, including <a href="http://www.python.org/doc/current/tut/node8.html#SECTION008410000000000000000"><code>from <var>module</var> import *</code></a>.
 
@@ -1756,10 +1756,10 @@ class Loaf: <span>&#x2460;</span>
 <li>You probably guessed this, but everything in a class is indented, just like the code within a function, <code>if</code> statement, <code>for</code> loop, and so forth. The first thing not indented is not in the class.
 <table id="compare.pass.java" class=note border="0" summary="">
 
-<td rowspan="2" align="center" valign="top" width="1%"><img src="images/note.png" alt="Note" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">The <code>pass</code> statement in Python is like an empty set of braces (<code>{}</code>) in Java or <acronym>C</acronym>.
+<td rowspan="2" align="center" valign="top" width="1%"><img src="images/note.png" alt="Note" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">The <code>pass</code> statement in Python is like an empty set of braces (<code>{}</code>) in Java or <abbr>C</abbr>.
 <p>Of course, realistically, most classes will be inherited from other classes, and they will define their own class methods
 and attributes. But as you've just seen, there is nothing that a class absolutely must have, other than a name. In particular,
-<acronym>C++</acronym> programmers may find it odd that Python classes don't have explicit constructors and destructors. Python classes do have something similar to a constructor: the <code>__init__</code> method.
+<abbr>C++</abbr> programmers may find it odd that Python classes don't have explicit constructors and destructors. Python classes do have something similar to a constructor: the <code>__init__</code> method.
 <div class=example><h3 id="fileinfo.class.example">Example 5.4. Defining the <code>FileInfo</code> Class</h3><pre><code>
 from UserDict import UserDict
 
@@ -1791,7 +1791,7 @@ class FileInfo(UserDict):
                them optional to the caller. In this case, <var>filename</var> has a default value of <code>None</code>, which is the Python null value.
 <table id="compare.self.java" class=note border="0" summary="">
 
-<td rowspan="2" align="center" valign="top" width="1%"><img src="images/note.png" alt="Note" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">By convention, the first argument of any Python class method (the reference to the current instance) is called <code>self</code>. This argument fills the role of the reserved word <code>this</code> in <acronym>C++</acronym> or Java, but <code>self</code> is not a reserved word in Python, merely a naming convention. Nonetheless, please don't call it anything but <code>self</code>; this is a very strong convention.
+<td rowspan="2" align="center" valign="top" width="1%"><img src="images/note.png" alt="Note" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">By convention, the first argument of any Python class method (the reference to the current instance) is called <code>self</code>. This argument fills the role of the reserved word <code>this</code> in <abbr>C++</abbr> or Java, but <code>self</code> is not a reserved word in Python, merely a naming convention. Nonetheless, please don't call it anything but <code>self</code>; this is a very strong convention.
 <div class=example><h3 id="fileinfo.init.code.example">Example 5.6. Coding the <code>FileInfo</code> Class</h3><pre><code>
 class FileInfo(UserDict):
     "store file metadata"
@@ -1844,7 +1844,7 @@ class FileInfo(UserDict):
 <li>Remember when the <code>__init__</code> method <a href="#fileinfo.class.example" title="Example 5.4. Defining the FileInfo Class">assigned its <var>filename</var> argument to <code>self["name"]</code></a>?  Well, here's the result. The arguments you pass when you create the class instance get sent right along to the <code>__init__</code> method (along with the object reference, <code>self</code>, which Python adds for free).
 <table id="compare.new.java" class=note border="0" summary="">
 
-<td rowspan="2" align="center" valign="top" width="1%"><img src="images/note.png" alt="Note" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">In Python, simply call a class as if it were a function to create a new instance of the class. There is no explicit <code>new</code> operator like <acronym>C++</acronym> or Java.
+<td rowspan="2" align="center" valign="top" width="1%"><img src="images/note.png" alt="Note" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">In Python, simply call a class as if it were a function to create a new instance of the class. There is no explicit <code>new</code> operator like <abbr>C++</abbr> or Java.
 <h3>5.4.1. Garbage Collection</h3>
 <p>If creating new instances is easy, destroying them is even easier. In general, there is no need to explicitly free instances,
    because they are freed automatically when the variables assigned to them go out of scope. Memory leaks are rare in Python.
@@ -1874,7 +1874,7 @@ class FileInfo(UserDict):
 <p>As you've seen, <code>FileInfo</code> is a class that acts like a dictionary. To explore this further, let's look at the <code>UserDict</code> class in the <code>UserDict</code> module, which is the ancestor of the <code>FileInfo</code> class. This is nothing special; the class is written in Python and stored in a <code>.py</code> file, just like any other Python code. In particular, it's stored in the <code>lib</code> directory in your Python installation.
 <table id="tip.locate" class=tip border="0" summary="">
 
-<td rowspan="2" align="center" valign="top" width="1%"><img src="images/tip.png" alt="Tip" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">In the ActivePython <acronym>IDE</acronym> on Windows, you can quickly open any module in your library path by selecting
+<td rowspan="2" align="center" valign="top" width="1%"><img src="images/tip.png" alt="Tip" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">In the ActivePython <abbr>IDE</abbr> on Windows, you can quickly open any module in your library path by selecting
 File->Locate... (<kbd class=shortcut>Ctrl-L</kbd>).
 <div class=example><h3 id="fileinfo.userdict.init.example">Example 5.9. Defining the <code>UserDict</code> Class</h3><pre><code>
 class UserDict:              <span>&#x2460;</span>
@@ -1887,24 +1887,24 @@ class UserDict:              <span>&#x2460;</span>
 <li>This is the <code>__init__</code> method that you <a href="#fileinfo.class.example" title="Example 5.4. Defining the FileInfo Class">overrode in the <code>FileInfo</code> class</a>. Note that the argument list in this ancestor class is different than the descendant. That's okay; each subclass can have
             its own set of arguments, as long as it calls the ancestor with the correct arguments. Here the ancestor class has a way
             to define initial values (by passing a dictionary in the <var>dict</var> argument) which the <code>FileInfo</code> does not use.
-<li>Python supports data attributes (called &#8220;instance variables&#8221; in Java and Powerbuilder, and &#8220;member variables&#8221; in <acronym>C++</acronym>). Data attributes are pieces of data held by a specific instance of a class. In this case, each instance of <code>UserDict</code> will have a data attribute <var>data</var>. To reference this attribute from code outside the class, you qualify it with the instance name, <code><var>instance</var>.data</code>, in the same way that you qualify a function with its module name. To reference a data attribute from within the class,
+<li>Python supports data attributes (called &#8220;instance variables&#8221; in Java and Powerbuilder, and &#8220;member variables&#8221; in <abbr>C++</abbr>). Data attributes are pieces of data held by a specific instance of a class. In this case, each instance of <code>UserDict</code> will have a data attribute <var>data</var>. To reference this attribute from code outside the class, you qualify it with the instance name, <code><var>instance</var>.data</code>, in the same way that you qualify a function with its module name. To reference a data attribute from within the class,
             you use <code>self</code> as the qualifier. By convention, all data attributes are initialized to reasonable values in the <code>__init__</code> method. However, this is not required, since data attributes, like local variables, <a href="#odbchelper.vardef" title="3.4. Declaring variables">spring into existence</a> when they are first assigned a value.
 <li>The <code>update</code> method is a dictionary duplicator: it copies all the keys and values from one dictionary to another. This does <em>not</em> clear the target dictionary first; if the target dictionary already has some keys, the ones from the source dictionary will
             be overwritten, but others will be left untouched. Think of <code>update</code> as a merge function, not a copy function.
 <li>This is a syntax you may not have seen before (I haven't used it in the examples in this book). It's an <code>if</code> statement, but instead of having an indented block starting on the next line, there is just a single statement on the same
             line, after the colon. This is perfectly legal syntax, which is just a shortcut you can use when you have only one statement
-            in a block. (It's like specifying a single statement without braces in <acronym>C++</acronym>.)  You can use this syntax, or you can have indented code on subsequent lines, but you can't do both for the same block.
+            in a block. (It's like specifying a single statement without braces in <abbr>C++</abbr>.)  You can use this syntax, or you can have indented code on subsequent lines, but you can't do both for the same block.
 <table id="compare.overloading" class=note border="0" summary="">
 
-<td rowspan="2" align="center" valign="top" width="1%"><img src="images/note.png" alt="Note" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">Java and Powerbuilder support function overloading by argument list, <i class=foreignphrase><acronym>i.e.</acronym></i> one class can have multiple methods with the same name but a different number of arguments, or arguments of different types.
-       Other languages (most notably <acronym>PL/SQL</acronym>) even support function overloading by argument name; <i class=foreignphrase><acronym>i.e.</acronym></i> one class can have multiple methods with the same name and the same number of arguments of the same type but different argument
+<td rowspan="2" align="center" valign="top" width="1%"><img src="images/note.png" alt="Note" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">Java and Powerbuilder support function overloading by argument list, <i class=foreignphrase><abbr>i.e.</abbr></i> one class can have multiple methods with the same name but a different number of arguments, or arguments of different types.
+       Other languages (most notably <abbr>PL/SQL</abbr>) even support function overloading by argument name; <i class=foreignphrase><abbr>i.e.</abbr></i> one class can have multiple methods with the same name and the same number of arguments of the same type but different argument
       names. Python supports neither of these; it has no form of function overloading whatsoever. Methods are defined solely by their name,
       and there can be only one method per class with a given name. So if a descendant class has an <code>__init__</code> method, it <em>always</em> overrides the ancestor <code>__init__</code> method, even if the descendant defines it with a different argument list. And the same rule applies to any other method.
 <table id="fileinfo.derivedclasses" class=note border="0" summary="">
 
 <td rowspan="2" align="center" valign="top" width="1%"><img src="images/note.png" alt="Note" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">Guido, the original author of Python, explains method overriding this way: "Derived classes may override methods of their base classes. Because methods have no
       special privileges when calling other methods of the same object, a method of a base class that calls another method defined
-      in the same base class, may in fact end up calling a method of a derived class that overrides it. (For <acronym>C++</acronym> programmers: all methods in Python are effectively virtual.)"  If that doesn't make sense to you (it confuses the hell out of me), feel free to ignore it. 
+      in the same base class, may in fact end up calling a method of a derived class that overrides it. (For <abbr>C++</abbr> programmers: all methods in Python are effectively virtual.)"  If that doesn't make sense to you (it confuses the hell out of me), feel free to ignore it. 
       I just thought I'd pass it along.
 <table id="note.dataattributes" class=caution border="0" summary="">
 
@@ -2190,7 +2190,7 @@ AttributeError: 'MP3FileInfo' instance has no attribute '__parse'</span></pre><d
 <p>Like many other programming languages, Python has exception handling via <code>try...except</code> blocks.
 <table id="compare.exceptions.java" class=note border="0" summary="">
 
-<td rowspan="2" align="center" valign="top" width="1%"><img src="images/note.png" alt="Note" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">Python uses <code>try...except</code> to handle exceptions and <code>raise</code> to generate them. Java and <acronym>C++</acronym> use <code>try...catch</code> to handle exceptions, and <code>throw</code> to generate them.
+<td rowspan="2" align="center" valign="top" width="1%"><img src="images/note.png" alt="Note" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">Python uses <code>try...except</code> to handle exceptions and <code>raise</code> to generate them. Java and <abbr>C++</abbr> use <code>try...catch</code> to handle exceptions, and <code>throw</code> to generate them.
 <p>Exceptions are everywhere in Python. Virtually every module in the standard Python library uses them, and Python itself will raise them in a lot of different circumstances. You've already seen them repeatedly throughout this book.
 <div class=itemizedlist>
 <ul>
@@ -2205,8 +2205,8 @@ AttributeError: 'MP3FileInfo' instance has no attribute '__parse'</span></pre><d
 <li><a href="#odbchelper.stringformatting.coerce" title="Example 3.22. String Formatting vs. Concatenating">Mixing datatypes without coercion</a> will raise a <code>TypeError</code> exception.
 
 </ul>
-<p>In each of these cases, you were simply playing around in the Python <acronym>IDE</acronym>: an error occurred, the exception was printed (depending on your <acronym>IDE</acronym>, perhaps in an intentionally jarring shade of red), and that was that. This is called an <em>unhandled</em> exception. When the exception was raised, there was no code to explicitly notice it and deal with it, so it bubbled its
-way back to the default behavior built in to Python, which is to spit out some debugging information and give up. In the <acronym>IDE</acronym>, that's no big deal, but if that happened while your actual Python program was running, the entire program would come to a screeching halt.
+<p>In each of these cases, you were simply playing around in the Python <abbr>IDE</abbr>: an error occurred, the exception was printed (depending on your <abbr>IDE</abbr>, perhaps in an intentionally jarring shade of red), and that was that. This is called an <em>unhandled</em> exception. When the exception was raised, there was no code to explicitly notice it and deal with it, so it bubbled its
+way back to the default behavior built in to Python, which is to spit out some debugging information and give up. In the <abbr>IDE</abbr>, that's no big deal, but if that happened while your actual Python program was running, the entire program would come to a screeching halt.
 <p>An exception doesn't need to result in a complete program crash, though. Exceptions, when raised, can be <em>handled</em>. Sometimes an exception is really because you have a bug in your code (like accessing a variable that doesn't exist), but
 many times, an exception is something you can anticipate. If you're opening a file, it might not exist. If you're connecting
 to a database, it might be unavailable, or you might not have the correct security credentials to access it. If you know
@@ -2239,7 +2239,7 @@ exceptions, errors occur immediately, and you can handle them in a standard way
    or to support multiple platforms (where platform-specific code is separated into different modules).
 <p>You can also define your own exceptions by creating a class that inherits from the built-in <code>Exception</code> class, and then raise your exceptions with the <code>raise</code> command. See the further reading section if you're interested in doing this.
 <p>The next example demonstrates how to use an exception to support platform-specific functionality. This code comes from the
-<code>getpass</code> module, a wrapper module for getting a password from the user. Getting a password is accomplished differently on <acronym>UNIX</acronym>, Windows, and Mac OS platforms, but this code encapsulates all of those differences.
+<code>getpass</code> module, a wrapper module for getting a password from the user. Getting a password is accomplished differently on <abbr>UNIX</abbr>, Windows, and Mac OS platforms, but this code encapsulates all of those differences.
 <div class=example><h3 id="crossplatform.example">Example 6.2. Supporting Platform-Specific Functionality</h3><pre><code>
   # Bind the name getpass to the appropriate function
   try:
@@ -2259,9 +2259,9 @@ exceptions, errors occur immediately, and you can handle them in a standard way
   else:
       getpass = unix_getpass</pre><div class=calloutlist>
 <ol>
-<li><code>termios</code> is a <acronym>UNIX</acronym>-specific module that provides low-level control over the input terminal. If this module is not available (because it's not
+<li><code>termios</code> is a <abbr>UNIX</abbr>-specific module that provides low-level control over the input terminal. If this module is not available (because it's not
                on your system, or your system doesn't support it), the import fails and Python raises an <code>ImportError</code>, which you catch.
-<li>OK, you didn't have <code>termios</code>, so let's try <code>msvcrt</code>, which is a Windows-specific module that provides an <acronym>API</acronym> to many useful functions in the Microsoft Visual C++ runtime services. If this import fails, Python will raise an <code>ImportError</code>, which you catch.
+<li>OK, you didn't have <code>termios</code>, so let's try <code>msvcrt</code>, which is a Windows-specific module that provides an <abbr>API</abbr> to many useful functions in the Microsoft Visual C++ runtime services. If this import fails, Python will raise an <code>ImportError</code>, which you catch.
 <li>If the first two didn't work, you try to import a function from <code>EasyDialogs</code>, which is a Mac OS-specific module that provides functions to pop up dialog boxes of various types. Once again, if this import fails, Python will raise an <code>ImportError</code>, which you catch.
 <li>None of these platform-specific modules is available (which is possible, since Python has been ported to a lot of different platforms), so you need to fall back on a default password input function (which is
                defined elsewhere in the <code>getpass</code> module). Notice what you're doing here: assigning the function <code>default_getpass</code> to the variable <var>getpass</var>. If you read the official <code>getpass</code> documentation, it tells you that the <code>getpass</code> module defines a <code>getpass</code> function. It does this by binding <var>getpass</var> to the correct function for your platform. Then when you call the <code>getpass</code> function, you're really calling a platform-specific function that this code has set up for you. You don't need to know or
@@ -2358,7 +2358,7 @@ ValueError: I/O operation on closed file</samp>
 <li>Just because a file is closed doesn't mean that the file object ceases to exist. The variable <var>f</var> will continue to exist until it <a href="#fileinfo.scope" title="Example 5.8. Trying to Implement a Memory Leak">goes out of scope</a> or gets manually deleted. However, none of the methods that manipulate an open file will work once the file has been closed;
                they all raise an exception.
 <li>Calling <code>close</code> on a file object whose file is already closed does <em>not</em> raise an exception; it fails silently.
-<h3>6.2.3. Handling <acronym>I/O</acronym> Errors</h3>
+<h3>6.2.3. Handling <abbr>I/O</abbr> Errors</h3>
 <p>Now you've seen enough to understand the file handling code in the <code>fileinfo.py</code> sample code from the previous chapter. This example shows how to safely open and read from a file and gracefully handle
    errors.
 <div class=example><h3 id="fileinfo.files.incode">Example 6.6. File Objects in <code>MP3FileInfo</code></h3><pre><code>
@@ -2486,7 +2486,7 @@ USERNAME=mpilgrim
 [...snip...]</span></pre><div class=calloutlist>
 <ol>
 <li><var>os.environ</var> is a dictionary of the environment variables defined on your system. In Windows, these are your user and system variables
-            accessible from <acronym>MS-DOS</acronym>. In <acronym>UNIX</acronym>, they are the variables exported in your shell's startup scripts. In Mac OS, there is no concept of environment variables, so this dictionary is empty.
+            accessible from <abbr>MS-DOS</abbr>. In <abbr>UNIX</abbr>, they are the variables exported in your shell's startup scripts. In Mac OS, there is no concept of environment variables, so this dictionary is empty.
 <li><code>os.environ.items()</code> returns a list of tuples: <code>[(<var>key1</var>, <var>value1</var>), (<var>key2</var>, <var>value2</var>), ...]</code>. The <code>for</code> loop iterates through this list. The first round, it assigns <code><var>key1</var></code> to <var>k</var> and <code><var>value1</var></code> to <var>v</var>, so <var>k</var> = <code>USERPROFILE</code> and <var>v</var> = <code>C:\Documents and Settings\mpilgrim</code>. In the second round, <var>k</var> gets the second key, <code>OS</code>, and <var>v</var> gets the corresponding value, <code>Windows_NT</code>.
 <li>With <a href="#odbchelper.multiassign" title="3.4.2. Assigning Multiple Values at Once">multi-variable assignment</a> and <a href="#odbchelper.map" title="3.6. Mapping Lists">list comprehensions</a>, you can replace the entire <code>for</code> loop with a single statement. Whether you actually do this in real code is a matter of personal coding style. I like it
             because it makes it clear that what I'm doing is mapping a dictionary into a list, then joining the list into a single string.
@@ -2530,7 +2530,7 @@ UserDict
 stat</span></pre><div class=calloutlist>
 <ol>
 <li>The <code>sys</code> module contains system-level information, such as the version of Python you're running (<code><code>sys</code>.version</code> or <code><code>sys</code>.version_info</code>), and system-level options such as the maximum allowed recursion depth (<code><code>sys</code>.getrecursionlimit()</code> and <code><code>sys</code>.setrecursionlimit()</code>).
-<li><code><code>sys</code>.modules</code> is a dictionary containing all the modules that have ever been imported since Python was started; the key is the module name, the value is the module object. Note that this is more than just the modules <em>your</em> program has imported. Python preloads some modules on startup, and if you're using a Python <acronym>IDE</acronym>, <code><code>sys</code>.modules</code> contains all the modules imported by all the programs you've run within the <acronym>IDE</acronym>.
+<li><code><code>sys</code>.modules</code> is a dictionary containing all the modules that have ever been imported since Python was started; the key is the module name, the value is the module object. Note that this is more than just the modules <em>your</em> program has imported. Python preloads some modules on startup, and if you're using a Python <abbr>IDE</abbr>, <code><code>sys</code>.modules</code> contains all the modules imported by all the programs you've run within the <abbr>IDE</abbr>.
 <p>This example demonstrates how to use <code><code>sys</code>.modules</code>.
 <div class=example><h3>Example 6.13. Using <code><code>sys</code>.modules</code></h3><pre class=screen><samp class=prompt>>>> </samp><kbd>import fileinfo</kbd>         <span>&#x2460;</span>
 <samp class=prompt>>>> </samp><kbd>print '\n'.join(sys.modules.keys())</kbd>
@@ -2604,7 +2604,7 @@ stat</samp>
 <li>In this slightly less trivial case, <code>join</code> will add an extra backslash to the pathname before joining it to the filename. I was overjoyed when I discovered this, since
 <code>addSlashIfNecessary</code> is one of the stupid little functions I always need to write when building up my toolbox in a new language. <em>Do not</em> write this stupid little function in Python; smart people have already taken care of it for you.
 <li><code>expanduser</code> will expand a pathname that uses <code>~</code> to represent the current user's home directory. This works on any platform where users have a home directory, like Windows,
-<acronym>UNIX</acronym>, and Mac OS X; it has no effect on Mac OS.
+<abbr>UNIX</abbr>, and Mac OS X; it has no effect on Mac OS.
 <li>Combining these techniques, you can easily construct pathnames for directories and files under the user's home directory.
 <div class=example><h3 id="splittingpathnames.example">Example 6.17. Splitting Pathnames</h3><pre class=screen><samp class=prompt>>>> </samp><kbd>os.path.split("c:\\music\\ap\\mahadeva.mp3")</kbd>      <span>&#x2460;</span>
 ('c:\\music\\ap', 'mahadeva.mp3')
@@ -2662,14 +2662,14 @@ def listDirectory(directory, fileExtList):
                 if os.path.splitext(f)[1] in fileExtList]  <span>&#x2462;</span> <span>&#x2463;</span> <span>&#x2464;</span></pre><div class=calloutlist>
 <ol>
 <li><code>os.listdir(directory)</code> returns a list of all the files and folders in <var>directory</var>.
-<li>Iterating through the list with <var>f</var>, you use <code>os.path.normcase(f)</code> to normalize the case according to operating system defaults. <code>normcase</code> is a useful little function that compensates for case-insensitive operating systems that think that <code>mahadeva.mp3</code> and <code>mahadeva.MP3</code> are the same file. For instance, on Windows and Mac OS, <code>normcase</code> will convert the entire filename to lowercase; on <acronym>UNIX</acronym>-compatible systems, it will return the filename unchanged.
+<li>Iterating through the list with <var>f</var>, you use <code>os.path.normcase(f)</code> to normalize the case according to operating system defaults. <code>normcase</code> is a useful little function that compensates for case-insensitive operating systems that think that <code>mahadeva.mp3</code> and <code>mahadeva.MP3</code> are the same file. For instance, on Windows and Mac OS, <code>normcase</code> will convert the entire filename to lowercase; on <abbr>UNIX</abbr>-compatible systems, it will return the filename unchanged.
 <li>Iterating through the normalized list with <var>f</var> again, you use <code>os.path.splitext(f)</code> to split each filename into name and extension.
 <li>For each file, you see if the extension is in the list of file extensions you care about (<var>fileExtList</var>, which was passed to the <code>listDirectory</code> function).
 <li>For each file you care about, you use <code>os.path.join(directory, f)</code> to construct the full pathname of the file, and return a list of the full pathnames.
 <table id="tip.os" class=note border="0" summary="">
 
 <td rowspan="2" align="center" valign="top" width="1%"><img src="images/note.png" alt="Note" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">Whenever possible, you should use the functions in <code>os</code> and <code>os.path</code> for file, directory, and path manipulations. These modules are wrappers for platform-specific modules, so functions like
-<code>os.path.split</code> work on <acronym>UNIX</acronym>, Windows, Mac OS, and any other platform supported by Python.
+<code>os.path.split</code> work on <abbr>UNIX</abbr>, Windows, Mac OS, and any other platform supported by Python.
 <p>There is one other way to get the contents of a directory. It's very powerful, and it uses the sort of wildcards that you
 may already be familiar with from working on the command line.
 <div class=example><h3 id="fileinfo.os.glob.example">Example 6.20. Listing Directories with <code>glob</code></h3><pre class=screen>
@@ -2735,7 +2735,7 @@ def listDirectory(directory, fileExtList):     <span>&#x2460;</span>
 <p>Note that <code>listDirectory</code> is completely generic. It doesn't know ahead of time which types of files it will be getting, or which classes are defined
 that could potentially handle those files. It inspects the directory for the files to process, and then introspects its own
 module to see what special handler classes (like <code>MP3FileInfo</code>) are defined. You can extend this program to handle other types of files simply by defining an appropriately-named class:
-<code>HTMLFileInfo</code> for <acronym>HTML</acronym> files, <code>DOCFileInfo</code> for Word <code>.doc</code> files, and so forth. <code>listDirectory</code> will handle them all, without modification, by handing off the real work to the appropriate classes and collating the results.
+<code>HTMLFileInfo</code> for <abbr>HTML</abbr> files, <code>DOCFileInfo</code> for Word <code>.doc</code> files, and so forth. <code>listDirectory</code> will handle them all, without modification, by handing off the real work to the appropriate classes and collating the results.
 <h2 id="fileinfo.summary2">6.7. Summary</h2>
 <p>The <code>fileinfo.py</code> program introduced in <a href="#fileinfo">Chapter 5</a> should now make perfect sense.
 <pre><code>
@@ -2829,10 +2829,10 @@ if __name__ == "__main__":
 
 </ul>
 <div class=chapter>
-<h2 id="dialect">Chapter 8. <acronym>HTML</acronym> Processing</h2>
+<h2 id="dialect">Chapter 8. <abbr>HTML</abbr> Processing</h2>
 <h2 id="dialect.divein">8.1. Diving in</h2>
-<p>I often see questions on <a href="http://groups.google.com/groups?group=comp.lang.python">comp.lang.python</a> like &#8220;How can I list all the [headers|images|links] in my <acronym>HTML</acronym> document?&#8221;  &#8220;How do I parse/translate/munge the text of my <acronym>HTML</acronym> document but leave the tags alone?&#8221;  &#8220;How can I add/remove/quote attributes of all my <acronym>HTML</acronym> tags at once?&#8221;  This chapter will answer all of these questions.
-<p>Here is a complete, working Python program in two parts. The first part, <code>BaseHTMLProcessor.py</code>, is a generic tool to help you process <acronym>HTML</acronym> files by walking through the tags and text blocks. The second part, <code>dialect.py</code>, is an example of how to use <code>BaseHTMLProcessor.py</code> to translate the text of an <acronym>HTML</acronym> document but leave the tags alone. Read the <code>docstring</code>s and comments to get an overview of what's going on. Most of it will seem like black magic, because it's not obvious how
+<p>I often see questions on <a href="http://groups.google.com/groups?group=comp.lang.python">comp.lang.python</a> like &#8220;How can I list all the [headers|images|links] in my <abbr>HTML</abbr> document?&#8221;  &#8220;How do I parse/translate/munge the text of my <abbr>HTML</abbr> document but leave the tags alone?&#8221;  &#8220;How can I add/remove/quote attributes of all my <abbr>HTML</abbr> tags at once?&#8221;  This chapter will answer all of these questions.
+<p>Here is a complete, working Python program in two parts. The first part, <code>BaseHTMLProcessor.py</code>, is a generic tool to help you process <abbr>HTML</abbr> files by walking through the tags and text blocks. The second part, <code>dialect.py</code>, is an example of how to use <code>BaseHTMLProcessor.py</code> to translate the text of an <abbr>HTML</abbr> document but leave the tags alone. Read the <code>docstring</code>s and comments to get an overview of what's going on. Most of it will seem like black magic, because it's not obvious how
 any of these class methods ever get called. Don't worry, all will be revealed in due time.
 <div class=example><h3 id="dialect.basehtml.listing">Example 8.1. <code>BaseHTMLProcessor.py</code></h3>
 <p>If you have not already done so, you can <a href="http://diveintopython3.org/download/diveintopython3-examples-5.4.zip" title="Download example scripts">download this and other examples</a> used in this book.
@@ -3061,7 +3061,7 @@ def test(url):
 
 if __name__ == "__main__":
     test("http://diveintopython3.org/odbchelper_list.html")</pre><div class=example><h3>Example 8.3. Output of <code>dialect.py</code></h3>
-<p>Running this script will translate <a href="#odbchelper.list" title="3.2. Introducing Lists">Section 3.2, &#8220;Introducing Lists&#8221;</a> into <a href="../native_data_types/chef.html">mock Swedish Chef-speak</a> (from The Muppets), <a href="../native_data_types/fudd.html">mock Elmer Fudd-speak</a> (from Bugs Bunny cartoons), and <a href="../native_data_types/olde.html">mock Middle English</a> (loosely based on Chaucer's <i class=citetitle>The Canterbury Tales</i>). If you look at the <acronym>HTML</acronym> source of the output pages, you'll see that all the <acronym>HTML</acronym> tags and attributes are untouched, but the text between the tags has been &#8220;translated&#8221; into the mock language. If you look closer, you'll see that, in fact, only the titles and paragraphs were translated; the
+<p>Running this script will translate <a href="#odbchelper.list" title="3.2. Introducing Lists">Section 3.2, &#8220;Introducing Lists&#8221;</a> into <a href="../native_data_types/chef.html">mock Swedish Chef-speak</a> (from The Muppets), <a href="../native_data_types/fudd.html">mock Elmer Fudd-speak</a> (from Bugs Bunny cartoons), and <a href="../native_data_types/olde.html">mock Middle English</a> (loosely based on Chaucer's <i class=citetitle>The Canterbury Tales</i>). If you look at the <abbr>HTML</abbr> source of the output pages, you'll see that all the <abbr>HTML</abbr> tags and attributes are untouched, but the text between the tags has been &#8220;translated&#8221; into the mock language. If you look closer, you'll see that, in fact, only the titles and paragraphs were translated; the
    code listings and screen examples were left untouched.
 <pre><code>
 &lt;div class=abstract>
@@ -3072,34 +3072,34 @@ in &lt;span class=application>Powewbuiwdew&lt;/span>, bwace youwsewf fow
 &lt;span class=application>Pydon&lt;/span> wists.&lt;/p>
 &lt;/div>
 </pre><h2 id="dialect.sgmllib">8.2. Introducing <code>sgmllib.py</code></h2>
-<p><acronym>HTML</acronym> processing is broken into three steps: breaking down the <acronym>HTML</acronym> into its constituent pieces, fiddling with the pieces, and reconstructing the pieces into <acronym>HTML</acronym> again. The first step is done by <code>sgmllib.py</code>, a part of the standard Python library.
-<p>The key to understanding this chapter is to realize that <acronym>HTML</acronym> is not just text, it is structured text. The structure is derived from the more-or-less-hierarchical sequence of start tags
-and end tags. Usually you don't work with <acronym>HTML</acronym> this way; you work with it <em>textually</em> in a text editor, or <em>visually</em> in a web browser or web authoring tool. <code>sgmllib.py</code> presents <acronym>HTML</acronym> <em>structurally</em>.
-<p><code>sgmllib.py</code> contains one important class: <code>SGMLParser</code>. <code>SGMLParser</code> parses <acronym>HTML</acronym> into useful pieces, like start tags and end tags. As soon as it succeeds in breaking down some data into a useful piece,
-it calls a method on itself based on what it found. In order to use the parser, you subclass the <code>SGMLParser</code> class and override these methods. This is what I meant when I said that it presents <acronym>HTML</acronym> <em>structurally</em>: the structure of the <acronym>HTML</acronym> determines the sequence of method calls and the arguments passed to each method.
-<p><code>SGMLParser</code> parses <acronym>HTML</acronym> into 8 kinds of data, and calls a separate method for each of them:
+<p><abbr>HTML</abbr> processing is broken into three steps: breaking down the <abbr>HTML</abbr> into its constituent pieces, fiddling with the pieces, and reconstructing the pieces into <abbr>HTML</abbr> again. The first step is done by <code>sgmllib.py</code>, a part of the standard Python library.
+<p>The key to understanding this chapter is to realize that <abbr>HTML</abbr> is not just text, it is structured text. The structure is derived from the more-or-less-hierarchical sequence of start tags
+and end tags. Usually you don't work with <abbr>HTML</abbr> this way; you work with it <em>textually</em> in a text editor, or <em>visually</em> in a web browser or web authoring tool. <code>sgmllib.py</code> presents <abbr>HTML</abbr> <em>structurally</em>.
+<p><code>sgmllib.py</code> contains one important class: <code>SGMLParser</code>. <code>SGMLParser</code> parses <abbr>HTML</abbr> into useful pieces, like start tags and end tags. As soon as it succeeds in breaking down some data into a useful piece,
+it calls a method on itself based on what it found. In order to use the parser, you subclass the <code>SGMLParser</code> class and override these methods. This is what I meant when I said that it presents <abbr>HTML</abbr> <em>structurally</em>: the structure of the <abbr>HTML</abbr> determines the sequence of method calls and the arguments passed to each method.
+<p><code>SGMLParser</code> parses <abbr>HTML</abbr> into 8 kinds of data, and calls a separate method for each of them:
 <div class=variablelist>
 <dl>
 <dt>Start tag</dt>
-<dd>An <acronym>HTML</acronym> tag that starts a block, like <code>&lt;html></code>, <code>&lt;head></code>, <code>&lt;body></code>, or <code>&lt;pre></code>, or a standalone tag like <code>&lt;br></code> or <code>&lt;img></code>. When it finds a start tag <var><code>tagname</code></var>, <code>SGMLParser</code> will look for a method called <code>start_<var><code>tagname</code></var></code> or <code>do_<var><code>tagname</code></var></code>. For instance, when it finds a <code>&lt;pre></code> tag, it will look for a <code>start_pre</code> or <code>do_pre</code> method. If found, <code>SGMLParser</code> calls this method with a list of the tag's attributes; otherwise, it calls <code>unknown_starttag</code> with the tag name and list of attributes.
+<dd>An <abbr>HTML</abbr> tag that starts a block, like <code>&lt;html></code>, <code>&lt;head></code>, <code>&lt;body></code>, or <code>&lt;pre></code>, or a standalone tag like <code>&lt;br></code> or <code>&lt;img></code>. When it finds a start tag <var><code>tagname</code></var>, <code>SGMLParser</code> will look for a method called <code>start_<var><code>tagname</code></var></code> or <code>do_<var><code>tagname</code></var></code>. For instance, when it finds a <code>&lt;pre></code> tag, it will look for a <code>start_pre</code> or <code>do_pre</code> method. If found, <code>SGMLParser</code> calls this method with a list of the tag's attributes; otherwise, it calls <code>unknown_starttag</code> with the tag name and list of attributes.
 </dd>
 <dt>End tag</dt>
-<dd>An <acronym>HTML</acronym> tag that ends a block, like <code>&lt;/html></code>, <code>&lt;/head></code>, <code>&lt;/body></code>, or <code>&lt;/pre></code>. When it finds an end tag, <code>SGMLParser</code> will look for a method called <code>end_<var><code>tagname</code></var></code>. If found, <code>SGMLParser</code> calls this method, otherwise it calls <code>unknown_endtag</code> with the tag name.
+<dd>An <abbr>HTML</abbr> tag that ends a block, like <code>&lt;/html></code>, <code>&lt;/head></code>, <code>&lt;/body></code>, or <code>&lt;/pre></code>. When it finds an end tag, <code>SGMLParser</code> will look for a method called <code>end_<var><code>tagname</code></var></code>. If found, <code>SGMLParser</code> calls this method; otherwise, it calls <code>unknown_endtag</code> with the tag name.
 </dd>
 <dt>Character reference</dt>
 <dd>An escaped character referenced by its decimal or hexadecimal equivalent, like <code>&amp;#160;</code>. When found, <code>SGMLParser</code> calls <code>handle_charref</code> with the text of the decimal or hexadecimal character equivalent.
 </dd>
 <dt>Entity reference</dt>
-<dd>An <acronym>HTML</acronym> entity, like <code>&amp;copy;</code>. When found, <code>SGMLParser</code> calls <code>handle_entityref</code> with the name of the <acronym>HTML</acronym> entity.
+<dd>An <abbr>HTML</abbr> entity, like <code>&amp;copy;</code>. When found, <code>SGMLParser</code> calls <code>handle_entityref</code> with the name of the <abbr>HTML</abbr> entity.
 </dd>
 <dt>Comment</dt>
-<dd>An <acronym>HTML</acronym> comment, enclosed in <code>&lt;!-- ... --></code>. When found, <code>SGMLParser</code> calls <code>handle_comment</code> with the body of the comment.
+<dd>An <abbr>HTML</abbr> comment, enclosed in <code>&lt;!-- ... --></code>. When found, <code>SGMLParser</code> calls <code>handle_comment</code> with the body of the comment.
 </dd>
 <dt>Processing instruction</dt>
-<dd>An <acronym>HTML</acronym> processing instruction, enclosed in <code>&lt;? ... ></code>. When found, <code>SGMLParser</code> calls <code>handle_pi</code> with the body of the processing instruction.
+<dd>An <abbr>HTML</abbr> processing instruction, enclosed in <code>&lt;? ... ></code>. When found, <code>SGMLParser</code> calls <code>handle_pi</code> with the body of the processing instruction.
 </dd>
 <dt>Declaration</dt>
-<dd>An <acronym>HTML</acronym> declaration, such as a <code>DOCTYPE</code>, enclosed in <code>&lt;! ... ></code>. When found, <code>SGMLParser</code> calls <code>handle_decl</code> with the body of the declaration.
+<dd>An <abbr>HTML</abbr> declaration, such as a <code>DOCTYPE</code>, enclosed in <code>&lt;! ... ></code>. When found, <code>SGMLParser</code> calls <code>handle_decl</code> with the body of the declaration.
 </dd>
 <dt>Text data</dt>
 <dd>A block of text. Anything that doesn't fit into the other 7 categories. When found, <code>SGMLParser</code> calls <code>handle_data</code> with the text.
@@ -3108,13 +3108,13 @@ it calls a method on itself based on what it found. In order to use the parser,
 <table class=important border="0" summary="">
 
 <td rowspan="2" align="center" valign="top" width="1%"><img src="images/important.png" alt="Important" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">Python 2.0 had a bug where <code>SGMLParser</code> would not recognize declarations at all (<code>handle_decl</code> would never be called), which meant that <code>DOCTYPE</code>s were silently ignored. This is fixed in Python 2.1.
-<p><code>sgmllib.py</code> comes with a test suite to illustrate this. You can run <code>sgmllib.py</code>, passing the name of an <acronym>HTML</acronym> file on the command line, and it will print out the tags and other elements as it parses them. It does this by subclassing
+<p><code>sgmllib.py</code> comes with a test suite to illustrate this. You can run <code>sgmllib.py</code>, passing the name of an <abbr>HTML</abbr> file on the command line, and it will print out the tags and other elements as it parses them. It does this by subclassing
 the <code>SGMLParser</code> class and defining <code>unknown_starttag</code>, <code>unknown_endtag</code>, <code>handle_data</code> and other methods which simply print their arguments.
 <table id="tip.commandline.windows" class=tip border="0" summary="">
 
-<td rowspan="2" align="center" valign="top" width="1%"><img src="images/tip.png" alt="Tip" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">In the ActivePython <acronym>IDE</acronym> on Windows, you can specify command line arguments in the &#8220;Run script&#8221; dialog. Separate multiple arguments with spaces.
+<td rowspan="2" align="center" valign="top" width="1%"><img src="images/tip.png" alt="Tip" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">In the ActivePython <abbr>IDE</abbr> on Windows, you can specify command line arguments in the &#8220;Run script&#8221; dialog. Separate multiple arguments with spaces.
 <div class=example><h3>Example 8.4. Sample test of <code>sgmllib.py</code></h3>
-<p>Here is a snippet from the table of contents of the <acronym>HTML</acronym> version of this book. Of course your paths may vary. (If you haven't downloaded the <acronym>HTML</acronym> version of the book, you can do so at <a href="http://diveintopython3.org/">http://diveintopython3.org/</a>.
+<p>Here is a snippet from the table of contents of the <abbr>HTML</abbr> version of this book. Of course your paths may vary. (If you haven't downloaded the <abbr>HTML</abbr> version of the book, you can do so at <a href="http://diveintopython3.org/">http://diveintopython3.org/</a>.)
 <pre class=screen>
 <samp class=prompt>c:\python23\lib></samp> type "c:\downloads\diveintopython3\html\toc\index.html"
 <code>
@@ -3148,11 +3148,11 @@ data: '\n      '
 </span></pre><p>Here's the roadmap for the rest of the chapter:
 <div class=itemizedlist>
 <ul>
-<li>Subclass <code>SGMLParser</code> to create classes that extract interesting data out of <acronym>HTML</acronym> documents.
+<li>Subclass <code>SGMLParser</code> to create classes that extract interesting data out of <abbr>HTML</abbr> documents.
 
-<li>Subclass <code>SGMLParser</code> to create <code>BaseHTMLProcessor</code>, which overrides all 8 handler methods and uses them to reconstruct the original <acronym>HTML</acronym> from the pieces.
+<li>Subclass <code>SGMLParser</code> to create <code>BaseHTMLProcessor</code>, which overrides all 8 handler methods and uses them to reconstruct the original <abbr>HTML</abbr> from the pieces.
 
-<li>Subclass <code>BaseHTMLProcessor</code> to create <code>Dialectizer</code>, which adds some methods to process specific <acronym>HTML</acronym> tags specially, and overrides the <code>handle_data</code> method to provide a framework for processing the text blocks between the <acronym>HTML</acronym> tags.
+<li>Subclass <code>BaseHTMLProcessor</code> to create <code>Dialectizer</code>, which adds some methods to process specific <abbr>HTML</abbr> tags specially, and overrides the <code>handle_data</code> method to provide a framework for processing the text blocks between the <abbr>HTML</abbr> tags.
 
 <li>Subclass <code>Dialectizer</code> to create classes that define text processing rules used by <code>Dialectizer.handle_data</code>.
 
@@ -3160,9 +3160,9 @@ data: '\n      '
 
 </ul>
 <p>Along the way, you'll also learn about <code>locals</code>, <code>globals</code>, and dictionary-based string formatting.
-<h2 id="dialect.extract">8.3. Extracting data from <acronym>HTML</acronym> documents</h2>
-<p>To extract data from <acronym>HTML</acronym> documents, subclass the <code>SGMLParser</code> class and define methods for each tag or entity you want to capture.
-<p>The first step to extracting data from an <acronym>HTML</acronym> document is getting some <acronym>HTML</acronym>. If you have some <acronym>HTML</acronym> lying around on your hard drive, you can use <a href="#fileinfo.files" title="6.2. Working with File Objects">file functions</a> to read it, but the real fun begins when you get <acronym>HTML</acronym> from live web pages.
+<h2 id="dialect.extract">8.3. Extracting data from <abbr>HTML</abbr> documents</h2>
+<p>To extract data from <abbr>HTML</abbr> documents, subclass the <code>SGMLParser</code> class and define methods for each tag or entity you want to capture.
+<p>The first step to extracting data from an <abbr>HTML</abbr> document is getting some <abbr>HTML</abbr>. If you have some <abbr>HTML</abbr> lying around on your hard drive, you can use <a href="#fileinfo.files" title="6.2. Working with File Objects">file functions</a> to read it, but the real fun begins when you get <abbr>HTML</abbr> from live web pages.
 <div class=example><h3 id="dialect.extract.urllib">Example 8.5. Introducing <code>urllib</code></h3><pre class=screen>
 <samp class=prompt>>>> </samp><kbd>import urllib</kbd>   <span>&#x2460;</span>
 <samp class=prompt>>>> </samp><kbd>sock = urllib.urlopen("http://diveintopython3.org/")</kbd> <span>&#x2461;</span>
@@ -3185,11 +3185,11 @@ data: '\n      '
 
 [...snip...]</pre><div class=calloutlist>
 <ol>
-<li>The <code>urllib</code> module is part of the standard Python library. It contains functions for getting information about and actually retrieving data from Internet-based <acronym>URL</acronym>s (mainly web pages).
-<li>The simplest use of <code>urllib</code> is to retrieve the entire text of a web page using the <code>urlopen</code> function. Opening a <acronym>URL</acronym> is similar to <a href="#fileinfo.files" title="6.2. Working with File Objects">opening a file</a>. The return value of <code>urlopen</code> is a file-like object, which has some of the same methods as a file object.
-<li>The simplest thing to do with the file-like object returned by <code>urlopen</code> is <code>read</code>, which reads the entire <acronym>HTML</acronym> of the web page into a single string. The object also supports <code>readlines</code>, which reads the text line by line into a list.
+<li>The <code>urllib</code> module is part of the standard Python library. It contains functions for getting information about and actually retrieving data from Internet-based <abbr>URL</abbr>s (mainly web pages).
+<li>The simplest use of <code>urllib</code> is to retrieve the entire text of a web page using the <code>urlopen</code> function. Opening a <abbr>URL</abbr> is similar to <a href="#fileinfo.files" title="6.2. Working with File Objects">opening a file</a>. The return value of <code>urlopen</code> is a file-like object, which has some of the same methods as a file object.
+<li>The simplest thing to do with the file-like object returned by <code>urlopen</code> is <code>read</code>, which reads the entire <abbr>HTML</abbr> of the web page into a single string. The object also supports <code>readlines</code>, which reads the text line by line into a list.
 <li>When you're done with the object, make sure to <code>close</code> it, just like a normal file object.
-<li>You now have the complete <acronym>HTML</acronym> of the home page of <code>http://diveintopython3.org/</code> in a string, and you're ready to parse it.
+<li>You now have the complete <abbr>HTML</abbr> of the home page of <code>http://diveintopython3.org/</code> in a string, and you're ready to parse it.
 <div class=example><h3 id="dialect.extract.links">Example 8.6. Introducing <code>urllister.py</code></h3>
 <p>If you have not already done so, you can <a href="http://diveintopython3.org/download/diveintopython3-examples-5.4.zip" title="Download example scripts">download this and other examples</a> used in this book.
 <pre><code>
@@ -3207,7 +3207,7 @@ class URLLister(SGMLParser):
 <ol>
 <li><code>reset</code> is called by the <code>__init__</code> method of <code>SGMLParser</code>, and it can also be called manually once an instance of the parser has been created. So if you need to do any initialization,
             do it in <code>reset</code>, not in <code>__init__</code>, so that it will be re-initialized properly when someone re-uses a parser instance.
-<li><code>start_a</code> is called by <code>SGMLParser</code> whenever it finds an <code>&lt;a></code> tag. The tag may contain an <code>href</code> attribute, and/or other attributes, like <code>name</code> or <code>title</code>. The <var>attrs</var> parameter is a list of tuples, <code>[(<var>attribute</var>, <var>value</var>), (<var>attribute</var>, <var>value</var>), ...]</code>. Or it may be just an <code>&lt;a></code>, a valid (if useless) <acronym>HTML</acronym> tag, in which case <var>attrs</var> would be an empty list.
+<li><code>start_a</code> is called by <code>SGMLParser</code> whenever it finds an <code>&lt;a></code> tag. The tag may contain an <code>href</code> attribute, and/or other attributes, like <code>name</code> or <code>title</code>. The <var>attrs</var> parameter is a list of tuples, <code>[(<var>attribute</var>, <var>value</var>), (<var>attribute</var>, <var>value</var>), ...]</code>. Or it may be just an <code>&lt;a></code>, a valid (if useless) <abbr>HTML</abbr> tag, in which case <var>attrs</var> would be an empty list.
 <li>You can find out whether this <code>&lt;a></code> tag has an <code>href</code> attribute with a simple <a href="#odbchelper.multiassign" title="3.4.2. Assigning Multiple Values at Once">multi-variable</a> <a href="#odbchelper.map" title="3.6. Mapping Lists">list comprehension</a>.
 <li>String comparisons like <code>k=='href'</code> are always case-sensitive, but that's safe in this case, because <code>SGMLParser</code> converts attribute names to lowercase while building <var>attrs</var>.
 <div class=example><h3 id="dialect.feed.example">Example 8.7. Using <code>urllister.py</code></h3><pre class=screen>
@@ -3234,15 +3234,15 @@ download/diveintopython3-common-5.0.zip
 
 ... rest of output omitted for brevity ...</pre><div class=calloutlist>
 <ol>
-<li>Call the <code>feed</code> method, defined in <code>SGMLParser</code>, to get <acronym>HTML</acronym> into the parser.
+<li>Call the <code>feed</code> method, defined in <code>SGMLParser</code>, to get <abbr>HTML</abbr> into the parser.
 <sup>[<a name="d0e20503" href="#ftn.d0e20503">1</a>]</sup>  It takes a string, which is what <code>usock.read()</code> returns.
-<li>Like files, you should <code>close</code> your <acronym>URL</acronym> objects as soon as you're done with them.
-<li>You should <code>close</code> your parser object, too, but for a different reason. You've read all the data and fed it to the parser, but the <code>feed</code> method isn't guaranteed to have actually processed all the <acronym>HTML</acronym> you give it; it may buffer it, waiting for more. Be sure to call <code>close</code> to flush the buffer and force everything to be fully parsed.
-<li>Once the parser is <code>close</code>d, the parsing is complete, and <var>parser.urls</var> contains a list of all the linked <acronym>URL</acronym>s in the <acronym>HTML</acronym> document. (Your output may look different, if the download links have been updated by the time you read this.)
+<li>Like files, you should <code>close</code> your <abbr>URL</abbr> objects as soon as you're done with them.
+<li>You should <code>close</code> your parser object, too, but for a different reason. You've read all the data and fed it to the parser, but the <code>feed</code> method isn't guaranteed to have actually processed all the <abbr>HTML</abbr> you give it; it may buffer it, waiting for more. Be sure to call <code>close</code> to flush the buffer and force everything to be fully parsed.
+<li>Once the parser is <code>close</code>d, the parsing is complete, and <var>parser.urls</var> contains a list of all the linked <abbr>URL</abbr>s in the <abbr>HTML</abbr> document. (Your output may look different, if the download links have been updated by the time you read this.)
 <h2 id="dialect.basehtml">8.4. Introducing <code>BaseHTMLProcessor.py</code></h2>
 <p><code>SGMLParser</code> doesn't produce anything by itself. It parses and parses and parses, and it calls a method for each interesting thing it
-   finds, but the methods don't do anything. <code>SGMLParser</code> is an <acronym>HTML</acronym> <em>consumer</em>: it takes <acronym>HTML</acronym> and breaks it down into small, structured pieces. As you saw in the <a href="#dialect.extract" title="8.3. Extracting data from HTML documents">previous section</a>, you can subclass <code>SGMLParser</code> to define classes that catch specific tags and produce useful things, like a list of all the links on a web page. Now you'll
-   take this one step further by defining a class that catches everything <code>SGMLParser</code> throws at it and reconstructs the complete <acronym>HTML</acronym> document. In technical terms, this class will be an <acronym>HTML</acronym> <em>producer</em>.
+   finds, but the methods don't do anything. <code>SGMLParser</code> is an <abbr>HTML</abbr> <em>consumer</em>: it takes <abbr>HTML</abbr> and breaks it down into small, structured pieces. As you saw in the <a href="#dialect.extract" title="8.3. Extracting data from HTML documents">previous section</a>, you can subclass <code>SGMLParser</code> to define classes that catch specific tags and produce useful things, like a list of all the links on a web page. Now you'll
+   take this one step further by defining a class that catches everything <code>SGMLParser</code> throws at it and reconstructs the complete <abbr>HTML</abbr> document. In technical terms, this class will be an <abbr>HTML</abbr> <em>producer</em>.
 <p><code>BaseHTMLProcessor</code> subclasses <code>SGMLParser</code> and provides all 8 essential handler methods: <code>unknown_starttag</code>, <code>unknown_endtag</code>, <code>handle_charref</code>, <code>handle_entityref</code>, <code>handle_comment</code>, <code>handle_pi</code>, <code>handle_decl</code>, and <code>handle_data</code>.
 <div class=example><h3 id="dialect.basehtml.intro">Example 8.8. Introducing <code>BaseHTMLProcessor</code></h3><pre><code>
 class BaseHTMLProcessor(SGMLParser):
@@ -3277,27 +3277,27 @@ class BaseHTMLProcessor(SGMLParser):
     def handle_decl(self, text):
         self.pieces.append("&lt;!%(text)s>" % locals())</pre><div class=calloutlist>
 <ol>
-<li><code>reset</code>, called by <code>SGMLParser.__init__</code>, initializes <var>self.pieces</var> as an empty list before <a href="#fileinfo.init.code.example" title="Example 5.6. Coding the FileInfo Class">calling the ancestor method</a>. <var>self.pieces</var> is a <a href="#fileinfo.userdict.init.example" title="Example 5.9. Defining the UserDict Class">data attribute</a> which will hold the pieces of the <acronym>HTML</acronym> document you're constructing. Each handler method will reconstruct the <acronym>HTML</acronym> that <code>SGMLParser</code> parsed, and each method will append that string to <var>self.pieces</var>. Note that <var>self.pieces</var> is a list. You might be tempted to define it as a string and just keep appending each piece to it. That would work, but
+<li><code>reset</code>, called by <code>SGMLParser.__init__</code>, initializes <var>self.pieces</var> as an empty list before <a href="#fileinfo.init.code.example" title="Example 5.6. Coding the FileInfo Class">calling the ancestor method</a>. <var>self.pieces</var> is a <a href="#fileinfo.userdict.init.example" title="Example 5.9. Defining the UserDict Class">data attribute</a> which will hold the pieces of the <abbr>HTML</abbr> document you're constructing. Each handler method will reconstruct the <abbr>HTML</abbr> that <code>SGMLParser</code> parsed, and each method will append that string to <var>self.pieces</var>. Note that <var>self.pieces</var> is a list. You might be tempted to define it as a string and just keep appending each piece to it. That would work, but
 Python is much more efficient at dealing with lists.
-<sup>[<a name="d0e20702" href="#ftn.d0e20702">2</a>]</sup><li>Since <code>BaseHTMLProcessor</code> does not define any methods for specific tags (like the <code>start_a</code> method in <a href="#dialect.extract.links" title="Example 8.6. Introducing urllister.py"><code>URLLister</code></a>), <code>SGMLParser</code> will call <code>unknown_starttag</code> for every start tag. This method takes the tag (<var>tag</var>) and the list of attribute name/value pairs (<var>attrs</var>), reconstructs the original <acronym>HTML</acronym>, and appends it to <var>self.pieces</var>. The <a href="#odbchelper.stringformatting" title="3.5. Formatting Strings">string formatting</a> here is a little strange; you'll untangle that (and also the odd-looking <code>locals</code> function) later in this chapter.
+<sup>[<a name="d0e20702" href="#ftn.d0e20702">2</a>]</sup><li>Since <code>BaseHTMLProcessor</code> does not define any methods for specific tags (like the <code>start_a</code> method in <a href="#dialect.extract.links" title="Example 8.6. Introducing urllister.py"><code>URLLister</code></a>), <code>SGMLParser</code> will call <code>unknown_starttag</code> for every start tag. This method takes the tag (<var>tag</var>) and the list of attribute name/value pairs (<var>attrs</var>), reconstructs the original <abbr>HTML</abbr>, and appends it to <var>self.pieces</var>. The <a href="#odbchelper.stringformatting" title="3.5. Formatting Strings">string formatting</a> here is a little strange; you'll untangle that (and also the odd-looking <code>locals</code> function) later in this chapter.
 <li>Reconstructing end tags is much simpler; just take the tag name and wrap it in the <code>&lt;/...></code> brackets.
-<li>When <code>SGMLParser</code> finds a character reference, it calls <code>handle_charref</code> with the bare reference. If the <acronym>HTML</acronym> document contains the reference <code>&amp;#160;</code>, <var>ref</var> will be <code>160</code>. Reconstructing the original complete character reference just involves wrapping <var>ref</var> in <code>&amp;#...;</code> characters.
+<li>When <code>SGMLParser</code> finds a character reference, it calls <code>handle_charref</code> with the bare reference. If the <abbr>HTML</abbr> document contains the reference <code>&amp;#160;</code>, <var>ref</var> will be <code>160</code>. Reconstructing the original complete character reference just involves wrapping <var>ref</var> in <code>&amp;#...;</code> characters.
 <li>Entity references are similar to character references, but without the hash mark. Reconstructing the original entity reference
             requires wrapping <var>ref</var> in <code>&amp;...;</code> characters. (Actually, as an erudite reader pointed out to me, it's slightly more complicated than this. Only certain standard
-<acronym>HTML</acronym> entites end in a semicolon; other similar-looking entities do not. Luckily for us, the set of standard <acronym>HTML</acronym> entities is defined in a dictionary in a Python module called <code>htmlentitydefs</code>. Hence the extra <code>if</code> statement.)
+<abbr>HTML</abbr> entities end in a semicolon; other similar-looking entities do not. Luckily for us, the set of standard <abbr>HTML</abbr> entities is defined in a dictionary in a Python module called <code>htmlentitydefs</code>. Hence the extra <code>if</code> statement.)
 <li>Blocks of text are simply appended to <var>self.pieces</var> unaltered.
-<li><acronym>HTML</acronym> comments are wrapped in <code>&lt;!--...--></code> characters.
+<li><abbr>HTML</abbr> comments are wrapped in <code>&lt;!--...--></code> characters.
 <li>Processing instructions are wrapped in <code>&lt;?...></code> characters.
 <table class=important border="0" summary="">
 
-<td rowspan="2" align="center" valign="top" width="1%"><img src="images/important.png" alt="Important" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">The <acronym>HTML</acronym> specification requires that all non-<acronym>HTML</acronym> (like client-side JavaScript) must be enclosed in <acronym>HTML</acronym> comments, but not all web pages do this properly (and all modern web browsers are forgiving if they don't). <code>BaseHTMLProcessor</code> is not forgiving; if script is improperly embedded, it will be parsed as if it were <acronym>HTML</acronym>. For instance, if the script contains less-than and equals signs, <code>SGMLParser</code> may incorrectly think that it has found tags and attributes. <code>SGMLParser</code> always converts tags and attribute names to lowercase, which may break the script, and <code>BaseHTMLProcessor</code> always encloses attribute values in double quotes (even if the original <acronym>HTML</acronym> document used single quotes or no quotes), which will certainly break the script. Always protect your client-side script
-      within <acronym>HTML</acronym> comments.
+<td rowspan="2" align="center" valign="top" width="1%"><img src="images/important.png" alt="Important" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">The <abbr>HTML</abbr> specification requires that all non-<abbr>HTML</abbr> (like client-side JavaScript) must be enclosed in <abbr>HTML</abbr> comments, but not all web pages do this properly (and all modern web browsers are forgiving if they don't). <code>BaseHTMLProcessor</code> is not forgiving; if script is improperly embedded, it will be parsed as if it were <abbr>HTML</abbr>. For instance, if the script contains less-than and equals signs, <code>SGMLParser</code> may incorrectly think that it has found tags and attributes. <code>SGMLParser</code> always converts tags and attribute names to lowercase, which may break the script, and <code>BaseHTMLProcessor</code> always encloses attribute values in double quotes (even if the original <abbr>HTML</abbr> document used single quotes or no quotes), which will certainly break the script. Always protect your client-side script
+      within <abbr>HTML</abbr> comments.
 <div class=example><h3 id="dialect.output.example">Example 8.9. <code>BaseHTMLProcessor</code> output</h3><pre><code>
     def output(self):               <span>&#x2460;</span>
         """Return processed HTML as a single string"""
         return "".join(self.pieces) <span>&#x2461;</span></pre><div class=calloutlist>
 <ol>
-<li>This is the one method in <code>BaseHTMLProcessor</code> that is never called by the ancestor <code>SGMLParser</code>. Since the other handler methods store their reconstructed <acronym>HTML</acronym> in <var>self.pieces</var>, this function is needed to join all those pieces into one string. As noted before, Python is great at lists and mediocre at strings, so you only create the complete string when somebody explicitly asks for it.
+<li>This is the one method in <code>BaseHTMLProcessor</code> that is never called by the ancestor <code>SGMLParser</code>. Since the other handler methods store their reconstructed <abbr>HTML</abbr> in <var>self.pieces</var>, this function is needed to join all those pieces into one string. As noted before, Python is great at lists and mediocre at strings, so you only create the complete string when somebody explicitly asks for it.
 <li>If you prefer, you could use the <code>join</code> method of the <code>string</code> module instead: <code>string.join(self.pieces, "")</code><div class=itemizedlist>
 <h3>Further reading</h3>
 <ul>
@@ -3307,7 +3307,7 @@ Python is much more efficient at dealing with lists.
 
 </ul>
 <h2 id="dialect.locals">8.5. <code>locals</code> and <code>globals</code></h2>
-<p>Let's digress from <acronym>HTML</acronym> processing for a minute and talk about how Python handles variables. Python has two built-in functions, <code>locals</code> and <code>globals</code>, which provide dictionary-based access to local and global variables.
+<p>Let's digress from <abbr>HTML</abbr> processing for a minute and talk about how Python handles variables. Python has two built-in functions, <code>locals</code> and <code>globals</code>, which provide dictionary-based access to local and global variables.
 <p>Remember <code>locals</code>?  You first saw it here:
 <pre><code>
     def unknown_starttag(self, tag, attrs):
@@ -3458,8 +3458,8 @@ meaningful keys and values already. Like <a href="#dialect.locals" title="8.5. l
 <td rowspan="2" align="center" valign="top" width="1%"><img src="images/important.png" alt="Important" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">Using dictionary-based string formatting with <code>locals</code> is a convenient way of making complex string formatting expressions more readable, but it comes with a price. There is a
       slight performance hit in making the call to <code>locals</code>, since <a href="#dialect.locals.readonly.example" title="Example 8.12. locals is read-only, globals is not"><code>locals</code> builds a copy</a> of the local namespace.
 <h2 id="dialect.quoting">8.7. Quoting attribute values</h2>
-<p>A common question on <a href="http://groups.google.com/groups?group=comp.lang.python">comp.lang.python</a> is &#8220;I have a bunch of <acronym>HTML</acronym> documents with unquoted attribute values, and I want to properly quote them all. How can I do this?&#8221;<sup>[<a name="d0e21764" href="#ftn.d0e21764">4</a>]</sup>  (This is generally precipitated by a project manager who has found the <acronym>HTML</acronym>-is-a-standard religion joining a large project and proclaiming that all pages must validate against an <acronym>HTML</acronym> validator. Unquoted attribute values are a common violation of the <acronym>HTML</acronym> standard.)  Whatever the reason, unquoted attribute values are easy to fix by feeding <acronym>HTML</acronym> through <code>BaseHTMLProcessor</code>.
-<p><code>BaseHTMLProcessor</code> consumes <acronym>HTML</acronym> (since it's descended from <code>SGMLParser</code>) and produces equivalent <acronym>HTML</acronym>, but the <acronym>HTML</acronym> output is not identical to the input. Tags and attribute names will end up in lowercase, even if they started in uppercase
+<p>A common question on <a href="http://groups.google.com/groups?group=comp.lang.python">comp.lang.python</a> is &#8220;I have a bunch of <abbr>HTML</abbr> documents with unquoted attribute values, and I want to properly quote them all. How can I do this?&#8221;<sup>[<a name="d0e21764" href="#ftn.d0e21764">4</a>]</sup>  (This is generally precipitated by a project manager who has found the <abbr>HTML</abbr>-is-a-standard religion joining a large project and proclaiming that all pages must validate against an <abbr>HTML</abbr> validator. Unquoted attribute values are a common violation of the <abbr>HTML</abbr> standard.)  Whatever the reason, unquoted attribute values are easy to fix by feeding <abbr>HTML</abbr> through <code>BaseHTMLProcessor</code>.
+<p><code>BaseHTMLProcessor</code> consumes <abbr>HTML</abbr> (since it's descended from <code>SGMLParser</code>) and produces equivalent <abbr>HTML</abbr>, but the <abbr>HTML</abbr> output is not identical to the input. Tags and attribute names will end up in lowercase, even if they started in uppercase
 or mixed case, and attribute values will be enclosed in double quotes, even if they started in single quotes or with no quotes
 at all. It is this last side effect that you can take advantage of.
 <div class=example><h3 id="dialect.quoting.example">Example 8.16. Quoting attribute values</h3><pre class=screen>
@@ -3492,10 +3492,10 @@ at all. It is this last side effect that you can take advantage of.
 &lt;/body>
 &lt;/html></span></pre><div class=calloutlist>
 <ol>
-<li>Note that the attribute values of the <code>href</code> attributes in the <code>&lt;a></code> tags are not properly quoted. (Also note that you're using <a href="#odbchelper.triplequotes" title="Example 2.2. Defining the buildConnectionString Function's docstring">triple quotes</a> for something other than a <code>docstring</code>. And directly in the <acronym>IDE</acronym>, no less. They're very useful.)
+<li>Note that the attribute values of the <code>href</code> attributes in the <code>&lt;a></code> tags are not properly quoted. (Also note that you're using <a href="#odbchelper.triplequotes" title="Example 2.2. Defining the buildConnectionString Function's docstring">triple quotes</a> for something other than a <code>docstring</code>. And directly in the <abbr>IDE</abbr>, no less. They're very useful.)
 <li>Feed the parser.
 <li>Using the <code>output</code> function defined in <code>BaseHTMLProcessor</code>, you get the output as a single string, complete with quoted attribute values. While this may seem anti-climactic, think
-            about how much has actually happened here: <code>SGMLParser</code> parsed the entire <acronym>HTML</acronym> document, breaking it down into tags, refs, data, and so forth; <code>BaseHTMLProcessor</code> used those elements to reconstruct pieces of <acronym>HTML</acronym> (which are still stored in <var>parser.pieces</var>, if you want to see them); finally, you called <code>parser.output</code>, which joined all the pieces of <acronym>HTML</acronym> into one string.
+            about how much has actually happened here: <code>SGMLParser</code> parsed the entire <abbr>HTML</abbr> document, breaking it down into tags, refs, data, and so forth; <code>BaseHTMLProcessor</code> used those elements to reconstruct pieces of <abbr>HTML</abbr> (which are still stored in <var>parser.pieces</var>, if you want to see them); finally, you called <code>parser.output</code>, which joined all the pieces of <abbr>HTML</abbr> into one string.
 <h2 id="dialect.dialectizer">8.8. Introducing <code>dialect.py</code></h2>
 <p><code>Dialectizer</code> is a simple (and silly) descendant of <code>BaseHTMLProcessor</code>. It runs blocks of text through a series of substitutions, but it makes sure that anything within a <code><code>&lt;pre></code>...<code>&lt;/pre></code></code> block passes through unaltered.
 <p>To handle the <code>&lt;pre></code> blocks, you define two methods in <code>Dialectizer</code>: <code>start_pre</code> and <code>end_pre</code>.
@@ -3508,7 +3508,7 @@ at all. It is this last side effect that you can take advantage of.
         self.unknown_endtag("pre")          <span>&#x2464;</span>
         self.verbatim -= 1<span>&#x2465;</span></pre><div class=calloutlist>
 <ol>
-<li><code>start_pre</code> is called every time <code>SGMLParser</code> finds a <code>&lt;pre></code> tag in the <acronym>HTML</acronym> source. (In a minute, you'll see exactly how this happens.)  The method takes a single parameter, <var>attrs</var>, which contains the attributes of the tag (if any). <var>attrs</var> is a list of key/value tuples, just like <a href="#dialect.unknownstarttag" title="Example 8.14. Dictionary-based string formatting in BaseHTMLProcessor.py"><code>unknown_starttag</code></a> takes.
+<li><code>start_pre</code> is called every time <code>SGMLParser</code> finds a <code>&lt;pre></code> tag in the <abbr>HTML</abbr> source. (In a minute, you'll see exactly how this happens.)  The method takes a single parameter, <var>attrs</var>, which contains the attributes of the tag (if any). <var>attrs</var> is a list of key/value tuples, just like <a href="#dialect.unknownstarttag" title="Example 8.14. Dictionary-based string formatting in BaseHTMLProcessor.py"><code>unknown_starttag</code></a> takes.
 <li>In the <code>reset</code> method, you initialize a data attribute that serves as a counter for <code>&lt;pre></code> tags. Every time you hit a <code>&lt;pre></code> tag, you increment the counter; every time you hit a <code>&lt;/pre></code> tag, you'll decrement the counter. (You could just use this as a flag and set it to <code>1</code> and reset it to <code>0</code>, but it's just as easy to do it this way, and this handles the odd (but possible) case of nested <code>&lt;pre></code> tags.)  In a minute, you'll see how this counter is put to good use.
 <li>That's it, that's the only special processing you do for <code>&lt;pre></code> tags. Now you pass the list of attributes along to <code>unknown_starttag</code> so it can do the default processing.
 <li><code>end_pre</code> is called every time <code>SGMLParser</code> finds a <code>&lt;/pre></code> tag. Since end tags can not contain attributes, the method takes no parameters.
@@ -3563,7 +3563,7 @@ you need to override the <code>handle_data</code> method.
 <li>In the ancestor <a href="#dialect.basehtml.intro" title="Example 8.8. Introducing BaseHTMLProcessor"><code>BaseHTMLProcessor</code></a>, the <code>handle_data</code> method simply appended the text to the output buffer, <var>self.pieces</var>. Here the logic is only slightly more complicated. If you're in the middle of a <code><code>&lt;pre></code>...<code>&lt;/pre></code></code> block, <var>self.verbatim</var> will be some value greater than <code>0</code>, and you want to put the text in the output buffer unaltered. Otherwise, you will call a separate method to process the
             substitutions, then put the result of that into the output buffer. In Python, this is a one-liner, using <a href="#apihelper.andortrick.intro" title="Example 4.17. Introducing the and-or Trick">the <code>and-or</code> trick</a>.
 <p>You're close to completely understanding <code>Dialectizer</code>. The only missing link is the nature of the text substitutions themselves. If you know any Perl, you know that when complex text substitutions are required, the only real solution is regular expressions. The classes
-later in <code>dialect.py</code> define a series of regular expressions that operate on the text between the <acronym>HTML</acronym> tags. But you just had <a href="#re" title="Chapter 7. Regular Expressions">a whole chapter on regular expressions</a>. You don't really want to slog through regular expressions again, do you?  God knows I don't. I think you've learned enough
+later in <code>dialect.py</code> define a series of regular expressions that operate on the text between the <abbr>HTML</abbr> tags. But you just had <a href="#re" title="Chapter 7. Regular Expressions">a whole chapter on regular expressions</a>. You don't really want to slog through regular expressions again, do you?  God knows I don't. I think you've learned enough
 for one chapter.
 <h2 id="dialect.alltogether">8.9. Putting it all together</h2>
 <p>It's time to put everything you've learned so far to good use. I hope you were paying attention.
@@ -3596,7 +3596,7 @@ def translate(url, dialectName="chef"): <span>&#x2460;</span>
 <p>Why bother?  After all, there are only 3 <code>Dialectizer</code> classes; why not just use a <code>case</code> statement?  (Well, there's no <code>case</code> statement in Python, but why not just use a series of <code>if</code> statements?)  One reason: extensibility. The <code>translate</code> function has absolutely no idea how many Dialectizer classes you've defined. Imagine if you defined a new <code>FooDialectizer</code> tomorrow; <code>translate</code> would work by passing <code>'foo'</code> as the <var>dialectName</var>.
 <p>Even better, imagine putting <code>FooDialectizer</code> in a separate module, and importing it with <code>from <var>module</var> import</code>. You've already seen that this <a href="#dialect.globals.example" title="Example 8.11. Introducing globals">includes it in <code>globals</code>()</a>, so <code>translate</code> would still work without modification, even though <code>FooDialectizer</code> was in a separate file.
 <p>Now imagine that the name of the dialect is coming from somewhere outside the program, maybe from a database or from a user-inputted
-value on a form. You can use any number of server-side Python scripting architectures to dynamically generate web pages; this function could take a <acronym>URL</acronym> and a dialect name (both strings) in the query string of a web page request, and output the &#8220;translated&#8221; web page.
+value on a form. You can use any number of server-side Python scripting architectures to dynamically generate web pages; this function could take a <abbr>URL</abbr> and a dialect name (both strings) in the query string of a web page request, and output the &#8220;translated&#8221; web page.
 <p>Finally, imagine a <code>Dialectizer</code> framework with a plug-in architecture. You could put each <code>Dialectizer</code> class in a separate file, leaving only the <code>translate</code> function in <code>dialect.py</code>. Assuming a consistent naming scheme, the <code>translate</code> function could dynamic import the appropiate class from the appropriate file, given nothing but the dialect name. (You haven't
 seen dynamic importing yet, but I promise to cover it in a later chapter.)  To add a new dialect, you would simply add an
 appropriately-named file in the plug-ins directory (like <code>foodialect.py</code> which contains the <code>FooDialectizer</code> class). Calling the <code>translate</code> function with the dialect name <code>'foo'</code> would find the module <code>foodialect.py</code>, import the class <code>FooDialectizer</code>, and away you go.
@@ -3606,12 +3606,12 @@ appropriately-named file in the plug-ins directory (like <code>foodialect.py</co
     return parser.output()  <span>&#x2462;</span>
 </pre><div class=calloutlist>
 <ol>
-<li>After all that imagining, this is going to seem pretty boring, but the <code>feed</code> function is what <a href="#dialect.feed.example" title="Example 8.7. Using urllister.py">does the entire transformation</a>. You had the entire <acronym>HTML</acronym> source in a single string, so you only had to call <code>feed</code> once. However, you can call <code>feed</code> as often as you want, and the parser will just keep parsing. So if you were worried about memory usage (or you knew you
-            were going to be dealing with very large <acronym>HTML</acronym> pages), you could set this up in a loop, where you read a few bytes of <acronym>HTML</acronym> and fed it to the parser. The result would be the same.
+<li>After all that imagining, this is going to seem pretty boring, but the <code>feed</code> function is what <a href="#dialect.feed.example" title="Example 8.7. Using urllister.py">does the entire transformation</a>. You had the entire <abbr>HTML</abbr> source in a single string, so you only had to call <code>feed</code> once. However, you can call <code>feed</code> as often as you want, and the parser will just keep parsing. So if you were worried about memory usage (or you knew you
+            were going to be dealing with very large <abbr>HTML</abbr> pages), you could set this up in a loop, where you read a few bytes of <abbr>HTML</abbr> and fed it to the parser. The result would be the same.
 <li>Because <code>feed</code> maintains an internal buffer, you should always call the parser's <code>close</code> method when you're done (even if you fed it all at once, like you did). Otherwise you may find that your output is missing
             the last few bytes.
 <li>Remember, <code>output</code> is the function you defined on <code>BaseHTMLProcessor</code> that <a href="#dialect.output.example" title="Example 8.9. BaseHTMLProcessor output">joins all the pieces of output you've buffered</a> and returns them in a single string.
-<p>And just like that, you've &#8220;translated&#8221; a web page, given nothing but a <acronym>URL</acronym> and the name of a dialect.
+<p>And just like that, you've &#8220;translated&#8221; a web page, given nothing but a <abbr>URL</abbr> and the name of a dialect.
 <div class=itemizedlist>
 <h3>Further reading</h3>
 <ul>
@@ -3619,14 +3619,14 @@ appropriately-named file in the plug-ins directory (like <code>foodialect.py</co
 
 </ul>
 <h2 id="dialect.summary">8.10. Summary</h2>
-<p>Python provides you with a powerful tool, <code>sgmllib.py</code>, to manipulate <acronym>HTML</acronym> by turning its structure into an object model. You can use this tool in many different ways.
+<p>Python provides you with a powerful tool, <code>sgmllib.py</code>, to manipulate <abbr>HTML</abbr> by turning its structure into an object model. You can use this tool in many different ways.
 <div class=itemizedlist>
 <ul>
-<li>parsing the <acronym>HTML</acronym> looking for something specific
+<li>parsing the <abbr>HTML</abbr> looking for something specific
 
-<li>aggregating the results, like the <a href="#dialect.extract.links" title="Example 8.6. Introducing urllister.py"><acronym>URL</acronym> lister</a>
+<li>aggregating the results, like the <a href="#dialect.extract.links" title="Example 8.6. Introducing urllister.py"><abbr>URL</abbr> lister</a>
 <li>altering the structure along the way, like the <a href="#dialect.quoting.example" title="Example 8.16. Quoting attribute values">attribute quoter</a>
-<li>transforming the <acronym>HTML</acronym> into something else by manipulating the text while leaving the tags alone, like the <a href="#dialect.dialectizer" title="8.8. Introducing dialect.py"><code>Dialectizer</code></a>
+<li>transforming the <abbr>HTML</abbr> into something else by manipulating the text while leaving the tags alone, like the <a href="#dialect.dialectizer" title="8.8. Introducing dialect.py"><code>Dialectizer</code></a>
 </ul>
 <p>Along with these examples, you should be comfortable doing all of the following things:
 <div class=itemizedlist>
@@ -3638,7 +3638,7 @@ appropriately-named file in the plug-ins directory (like <code>foodialect.py</co
 </ul>
 <div class=footnotes><br><hr width="100" align="left">
 <div class=footnote>
-<p><sup>[<a name="ftn.d0e20503" href="#d0e20503">1</a>] </sup>The technical term for a parser like <code>SGMLParser</code> is a <em>consumer</em>: it consumes <acronym>HTML</acronym> and breaks it down. Presumably, the name <code>feed</code> was chosen to fit into the whole &#8220;consumer&#8221; motif. Personally, it makes me think of an exhibit in the zoo where there's just a dark cage with no trees or plants or
+<p><sup>[<a name="ftn.d0e20503" href="#d0e20503">1</a>] </sup>The technical term for a parser like <code>SGMLParser</code> is a <em>consumer</em>: it consumes <abbr>HTML</abbr> and breaks it down. Presumably, the name <code>feed</code> was chosen to fit into the whole &#8220;consumer&#8221; motif. Personally, it makes me think of an exhibit in the zoo where there's just a dark cage with no trees or plants or
    evidence of life of any kind, but if you stand perfectly still and look really closely you can make out two beady eyes staring
    back at you from the far left corner, but you convince yourself that that's just your mind playing tricks on you, and the
    only way you can tell that the whole thing isn't just an empty cage is a small innocuous sign on the railing that reads, &#8220;Do not feed the parser.&#8221;  But maybe that's just me. In any event, it's an interesting mental image.
@@ -3650,18 +3650,18 @@ appropriately-named file in the plug-ins directory (like <code>foodialect.py</co
 <div class=footnote>
 <p><sup>[<a name="ftn.d0e21226" href="#d0e21226">3</a>] </sup>I don't get out much.
 <div class=footnote>
-<p><sup>[<a name="ftn.d0e21764" href="#d0e21764">4</a>] </sup>All right, it's not that common a question. It's not up there with &#8220;What editor should I use to write Python code?&#8221; (answer: Emacs) or &#8220;Is Python better or worse than Perl?&#8221; (answer: &#8220;Perl is worse than Python because people wanted it worse.&#8221; -Larry Wall, 10/14/1998)  But questions about <acronym>HTML</acronym> processing pop up in one form or another about once a month, and among those questions, this is a popular one.
+<p><sup>[<a name="ftn.d0e21764" href="#d0e21764">4</a>] </sup>All right, it's not that common a question. It's not up there with &#8220;What editor should I use to write Python code?&#8221; (answer: Emacs) or &#8220;Is Python better or worse than Perl?&#8221; (answer: &#8220;Perl is worse than Python because people wanted it worse.&#8221; -Larry Wall, 10/14/1998)  But questions about <abbr>HTML</abbr> processing pop up in one form or another about once a month, and among those questions, this is a popular one.
 <div class=chapter>
-<h2 id="kgp">Chapter 9. <acronym>XML</acronym> Processing</h2>
+<h2 id="kgp">Chapter 9. <abbr>XML</abbr> Processing</h2>
 <h2 id="kgp.divein">9.1. Diving in</h2>
-<p>These next two chapters are about <acronym>XML</acronym> processing in Python. It would be helpful if you already knew what an <acronym>XML</acronym> document looks like, that it's made up of structured tags to form a hierarchy of elements, and so on. If this doesn't make
-sense to you, there are <a href="http://directory.google.com/Top/Computers/Data_Formats/Markup_Languages/XML/Resources/FAQs,_Help,_and_Tutorials/">many <acronym>XML</acronym> tutorials</a> that can explain the basics.
+<p>These next two chapters are about <abbr>XML</abbr> processing in Python. It would be helpful if you already knew what an <abbr>XML</abbr> document looks like, that it's made up of structured tags to form a hierarchy of elements, and so on. If this doesn't make
+sense to you, there are <a href="http://directory.google.com/Top/Computers/Data_Formats/Markup_Languages/XML/Resources/FAQs,_Help,_and_Tutorials/">many <abbr>XML</abbr> tutorials</a> that can explain the basics.
 <p>If you're not particularly interested in XML, you should still read these chapters, which cover important topics like Python packages, Unicode, command line arguments, and how to use <code>getattr</code> for method dispatching.
 <p>Being a philosophy major is not required, although if you have ever had the misfortune of being subjected to the writings
 of Immanuel Kant, you will appreciate the example program a lot more than if you majored in something useful, like computer
 science.
-<p>There are two basic ways to work with <acronym>XML</acronym>. One is called <acronym>SAX</acronym> (&#8220;Simple <acronym>API</acronym> for <acronym>XML</acronym>&#8221;), and it works by reading the <acronym>XML</acronym> a little bit at a time and calling a method for each element it finds. (If you read <a href="#dialect" title="Chapter 8. HTML Processing">Chapter 8, <i>HTML Processing</i></a>, this should sound familiar, because that's how the <code>sgmllib</code> module works.)  The other is called <acronym>DOM</acronym> (&#8220;Document Object Model&#8221;), and it works by reading in the entire <acronym>XML</acronym> document at once and creating an internal representation of it using native Python classes linked in a tree structure. Python has standard modules for both kinds of parsing, but this chapter will only deal with using the <acronym>DOM</acronym>.
-<p>The following is a complete Python program which generates pseudo-random output based on a context-free grammar defined in an <acronym>XML</acronym> format. Don't worry yet if you don't understand what that means; you'll examine both the program's input and its output
+<p>There are two basic ways to work with <abbr>XML</abbr>. One is called <abbr>SAX</abbr> (&#8220;Simple <abbr>API</abbr> for <abbr>XML</abbr>&#8221;), and it works by reading the <abbr>XML</abbr> a little bit at a time and calling a method for each element it finds. (If you read <a href="#dialect" title="Chapter 8. HTML Processing">Chapter 8, <i>HTML Processing</i></a>, this should sound familiar, because that's how the <code>sgmllib</code> module works.)  The other is called <abbr>DOM</abbr> (&#8220;Document Object Model&#8221;), and it works by reading in the entire <abbr>XML</abbr> document at once and creating an internal representation of it using native Python classes linked in a tree structure. Python has standard modules for both kinds of parsing, but this chapter will only deal with using the <abbr>DOM</abbr>.
+<p>The following is a complete Python program which generates pseudo-random output based on a context-free grammar defined in an <abbr>XML</abbr> format. Don't worry yet if you don't understand what that means; you'll examine both the program's input and its output
 in more depth throughout these next two chapters.
 <div class=example><h3>Example 9.1. <code>kgp.py</code></h3>
 <p>If you have not already done so, you can <a href="http://diveintopython3.org/download/diveintopython3-examples-5.4.zip" title="Download example scripts">download this and other examples</a> used in this book.
@@ -3953,7 +3953,7 @@ def openAnything(source):
     # treat source as string
     import StringIO     
     return StringIO.StringIO(str(source)) 
-</pre><p>Run the program <code>kgp.py</code> by itself, and it will parse the default <acronym>XML</acronym>-based grammar, in <code>kant.xml</code>, and print several paragraphs worth of philosophy in the style of Immanuel Kant.
+</pre><p>Run the program <code>kgp.py</code> by itself, and it will parse the default <abbr>XML</abbr>-based grammar, in <code>kant.xml</code>, and print several paragraphs' worth of philosophy in the style of Immanuel Kant.
 <div class=example><h3>Example 9.3. Sample output of <code>kgp.py</code></h3><pre class=screen><samp class=prompt>[you@localhost kgp]$ python kgp.py</samp>
 <samp>     As is shown in the writings of Hume, our a priori concepts, in
 reference to ends, abstract from all content of knowledge; in the study
@@ -4001,9 +4001,9 @@ completely different.
 10110100</pre><p>You will take a closer look at the structure of the grammar file later in this chapter. For now, all you need to know is
 that the grammar file defines the structure of the output, and the <code>kgp.py</code> program reads through the grammar and makes random decisions about which words to plug in where.
 <h2 id="kgp.packages">9.2. Packages</h2>
-<p>Actually parsing an <acronym>XML</acronym> document is very simple: one line of code. However, before you get to that line of code, you need to take a short detour
+<p>Actually parsing an <abbr>XML</abbr> document is very simple: one line of code. However, before you get to that line of code, you need to take a short detour
    to talk about packages.
-<div class=example><h3>Example 9.5. Loading an <acronym>XML</acronym> document (a sneak peek)</h3><pre class=screen>
+<div class=example><h3>Example 9.5. Loading an <abbr>XML</abbr> document (a sneak peek)</h3><pre class=screen>
 <samp class=prompt>>>> </samp><kbd>from xml.dom import minidom</kbd> <span>&#x2460;</span>
 <samp class=prompt>>>> </samp>xmldoc = minidom.parse('~/diveintopython3/common/py/kgp/binary.xml')</pre><div class=calloutlist>
 <ol>
@@ -4052,13 +4052,13 @@ The answer is the magical <code>__init__.py</code> file. You see, packages are n
 
 <td rowspan="2" align="center" valign="top" width="1%"><img src="images/note.png" alt="Note" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">A package is a directory with the special <code>__init__.py</code> file in it. The <code>__init__.py</code> file defines the attributes and methods of the package. It doesn't need to define anything; it can just be an empty file,
       but it has to exist. But if <code>__init__.py</code> doesn't exist, the directory is just a directory, not a package, and it can't be imported or contain modules or nested packages.
-<p>So why bother with packages?  Well, they provide a way to logically group related modules. Instead of having an <code>xml</code> package with <code>sax</code> and <code>dom</code> packages inside, the authors could have chosen to put all the <code>sax</code> functionality in <code>xmlsax.py</code> and all the <code>dom</code> functionality in <code>xmldom.py</code>, or even put all of it in a single module. But that would have been unwieldy (as of this writing, the <acronym>XML</acronym> package has over 3000 lines of code) and difficult to manage (separate source files mean multiple people can work on different
+<p>So why bother with packages?  Well, they provide a way to logically group related modules. Instead of having an <code>xml</code> package with <code>sax</code> and <code>dom</code> packages inside, the authors could have chosen to put all the <code>sax</code> functionality in <code>xmlsax.py</code> and all the <code>dom</code> functionality in <code>xmldom.py</code>, or even put all of it in a single module. But that would have been unwieldy (as of this writing, the <abbr>XML</abbr> package has over 3000 lines of code) and difficult to manage (separate source files mean multiple people can work on different
 areas simultaneously).
 <p>If you ever find yourself writing a large subsystem in Python (or, more likely, when you realize that your small subsystem has grown into a large one), invest some time designing a good
 package architecture. It's one of the many things Python is good at, so take advantage of it.
-<h2 id="kgp.parse">9.3. Parsing <acronym>XML</acronym></h2>
-<p>As I was saying, actually parsing an <acronym>XML</acronym> document is very simple: one line of code. Where you go from there is up to you.
-<div class=example><h3>Example 9.8. Loading an <acronym>XML</acronym> document (for real this time)</h3><pre class=screen>
+<h2 id="kgp.parse">9.3. Parsing <abbr>XML</abbr></h2>
+<p>As I was saying, actually parsing an <abbr>XML</abbr> document is very simple: one line of code. Where you go from there is up to you.
+<div class=example><h3>Example 9.8. Loading an <abbr>XML</abbr> document (for real this time)</h3><pre class=screen>
 <samp class=prompt>>>> </samp><kbd>from xml.dom import minidom</kbd>      <span>&#x2460;</span>
 <samp class=prompt>>>> </samp><kbd>xmldoc = minidom.parse('~/diveintopython3/common/py/kgp/binary.xml')</kbd>  <span>&#x2461;</span>
 <samp class=prompt>>>> </samp><kbd>xmldoc</kbd>         <span>&#x2462;</span>
@@ -4077,11 +4077,11 @@ package architecture. It's one of the many things Python is good at, so take adv
 &lt;/grammar></span></pre><div class=calloutlist>
 <ol>
 <li>As you saw in the <a href="#kgp.packages" title="9.2. Packages">previous section</a>, this imports the <code>minidom</code> module from the <code>xml.dom</code> package.
-<li>Here is the one line of code that does all the work: <code>minidom.parse</code> takes one argument and returns a parsed representation of the <acronym>XML</acronym> document. The argument can be many things; in this case, it's simply a filename of an <acronym>XML</acronym> document on my local disk. (To follow along, you'll need to change the path to point to your downloaded examples directory.)
+<li>Here is the one line of code that does all the work: <code>minidom.parse</code> takes one argument and returns a parsed representation of the <abbr>XML</abbr> document. The argument can be many things; in this case, it's simply a filename of an <abbr>XML</abbr> document on my local disk. (To follow along, you'll need to change the path to point to your downloaded examples directory.)
              But you can also pass a <a href="#fileinfo.files" title="6.2. Working with File Objects">file object</a>, or even a <a href="#dialect.extract.urllib" title="Example 8.5. Introducing urllib">file-like object</a>. You'll take advantage of this flexibility later in this chapter.
-<li>The object returned from <code>minidom.parse</code> is a <code>Document</code> object, a descendant of the <code>Node</code> class. This <code>Document</code> object is the root level of a complex tree-like structure of interlocking Python objects that completely represent the <acronym>XML</acronym> document you passed to <code>minidom.parse</code>.
-<li><code>toxml</code> is a method of the <code>Node</code> class (and is therefore available on the <code>Document</code> object you got from <code>minidom.parse</code>). <code>toxml</code> prints out the <acronym>XML</acronym> that this <code>Node</code> represents. For the <code>Document</code> node, this prints out the entire <acronym>XML</acronym> document.
-<p>Now that you have an <acronym>XML</acronym> document in memory, you can start traversing through it.
+<li>The object returned from <code>minidom.parse</code> is a <code>Document</code> object, a descendant of the <code>Node</code> class. This <code>Document</code> object is the root level of a complex tree-like structure of interlocking Python objects that completely represent the <abbr>XML</abbr> document you passed to <code>minidom.parse</code>.
+<li><code>toxml</code> is a method of the <code>Node</code> class (and is therefore available on the <code>Document</code> object you got from <code>minidom.parse</code>). <code>toxml</code> returns, as a string, the <abbr>XML</abbr> that this <code>Node</code> represents. For the <code>Document</code> node, that is the entire <abbr>XML</abbr> document.
+<p>Now that you have an <abbr>XML</abbr> document in memory, you can start traversing through it.
 <div class=example><h3 id="kgp.parse.gettingchildnodes.example">Example 9.9. Getting child nodes</h3><pre class=screen>
 <samp class=prompt>>>> </samp><kbd>xmldoc.childNodes</kbd>    <span>&#x2460;</span>
 [&lt;DOM Element: grammar at 17538908>]
@@ -4090,7 +4090,7 @@ package architecture. It's one of the many things Python is good at, so take adv
 <samp class=prompt>>>> </samp><kbd>xmldoc.firstChild</kbd>    <span>&#x2462;</span>
 &lt;DOM Element: grammar at 17538908></pre><div class=calloutlist>
 <ol>
-<li>Every <code>Node</code> has a <code>childNodes</code> attribute, which is a list of the <code>Node</code> objects. A <code>Document</code> always has only one child node, the root element of the <acronym>XML</acronym> document (in this case, the <code>grammar</code> element).
+<li>Every <code>Node</code> has a <code>childNodes</code> attribute, which is a list of the <code>Node</code> objects. A <code>Document</code> always has only one child node, the root element of the <abbr>XML</abbr> document (in this case, the <code>grammar</code> element).
 <li>To get the first (and in this case, the only) child node, just use regular list syntax. Remember, there is nothing special
             going on here; this is just a regular Python list of regular Python objects.
 <li>Since getting the first child node of a node is a useful and common activity, the <code>Node</code> class has a <code>firstChild</code> attribute, which is synonymous with <code>childNodes[0]</code>. (There is also a <code>lastChild</code> attribute, which is synonymous with <code>childNodes[-1]</code>.)
@@ -4108,7 +4108,7 @@ package architecture. It's one of the many things Python is good at, so take adv
 &lt;/ref>
 &lt;/grammar></span></pre><div class=calloutlist>
 <ol>
-<li>Since the <code>toxml</code> method is defined in the <code>Node</code> class, it is available on any <acronym>XML</acronym> node, not just the <code>Document</code> element.
+<li>Since the <code>toxml</code> method is defined in the <code>Node</code> class, it is available on any <abbr>XML</abbr> node, not just the <code>Document</code> element.
 <div class=example><h3 id="kgp.parse.childnodescanbetext.example">Example 9.11. Child nodes can be text</h3><pre class=screen>
 <samp class=prompt>>>> </samp><kbd>grammarNode.childNodes</kbd><span>&#x2460;</span>
 <samp>[&lt;DOM Text node "\n">, &lt;DOM Element: ref at 17533332>, \
@@ -4132,7 +4132,7 @@ package architecture. It's one of the many things Python is good at, so take adv
 
 </span></pre><div class=calloutlist>
 <ol>
-<li>Looking at the <acronym>XML</acronym> in <code>binary.xml</code>, you might think that the <code>grammar</code> has only two child nodes, the two <code>ref</code> elements. But you're missing something: the carriage returns!  After the <code>'&lt;grammar>'</code> and before the first <code>'&lt;ref>'</code> is a carriage return, and this text counts as a child node of the <code>grammar</code> element. Similarly, there is a carriage return after each <code>'&lt;/ref>'</code>; these also count as child nodes. So <code>grammar.childNodes</code> is actually a list of 5 objects: 3 <code>Text</code> objects and 2 <code>Element</code> objects.
+<li>Looking at the <abbr>XML</abbr> in <code>binary.xml</code>, you might think that the <code>grammar</code> has only two child nodes, the two <code>ref</code> elements. But you're missing something: the carriage returns!  After the <code>'&lt;grammar>'</code> and before the first <code>'&lt;ref>'</code> is a carriage return, and this text counts as a child node of the <code>grammar</code> element. Similarly, there is a carriage return after each <code>'&lt;/ref>'</code>; these also count as child nodes. So <code>grammar.childNodes</code> is actually a list of 5 objects: 3 <code>Text</code> objects and 2 <code>Element</code> objects.
 <li>The first child is a <code>Text</code> object representing the carriage return after the <code>'&lt;grammar>'</code> tag and before the first <code>'&lt;ref>'</code> tag.
 <li>The second child is an <code>Element</code> object representing the first <code>ref</code> element.
 <li>The fourth child is an <code>Element</code> object representing the second <code>ref</code> element.
@@ -4163,7 +4163,7 @@ u'0'</pre><div class=calloutlist>
 <li>The <code>p</code> element has only one child node (you can't tell that from this example, but look at <code>pNode.childNodes</code> if you don't believe me), and it is a <code>Text</code> node for the single character <code>'0'</code>.
 <li>The <code>.data</code> attribute of a <code>Text</code> node gives you the actual string that the text node represents. But what is that <code>'u'</code> in front of the string?  The answer to that deserves its own section.
 <h2 id="kgp.unicode">9.4. Unicode</h2>
-<p>Unicode is a system to represent characters from all the world's different languages. When Python parses an <acronym>XML</acronym> document, all data is stored in memory as unicode.
+<p>Unicode is a system to represent characters from all the world's different languages. When Python parses an <abbr>XML</abbr> document, all data is stored in memory as unicode.
 <p>You'll get to all that in a minute, but first, some background.
 <p><b>Historical note. </b>Before unicode, there were separate character encoding systems for each language, each using the same numbers (0-255) to represent
 that language's characters. Some languages (like Russian) have multiple conflicting standards about how to represent the
@@ -4179,14 +4179,14 @@ mode, so character 241 means something else. And so on.)  These are the problems
 <sup>[<a name="d0e23786" href="#ftn.d0e23786">5</a>]</sup>  Each 2-byte number represents a unique character used in at least one of the world's languages. (Characters that are used
 in multiple languages have the same numeric code.)  There is exactly 1 number per character, and exactly 1 character per number.
 Unicode data is never ambiguous.
-<p>Of course, there is still the matter of all these legacy encoding systems. 7-bit <acronym>ASCII</acronym>, for instance, which stores English characters as numbers ranging from 0 to 127. (65 is capital &#8220;<code>A</code>&#8221;, 97 is lowercase &#8220;<code>a</code>&#8221;, and so forth.)  English has a very simple alphabet, so it can be completely expressed in 7-bit <acronym>ASCII</acronym>. Western European languages like French, Spanish, and German all use an encoding system called ISO-8859-1 (also called &#8220;latin-1&#8221;), which uses the 7-bit <acronym>ASCII</acronym> characters for the numbers 0 through 127, but then extends into the 128-255 range for characters like n-with-a-tilde-over-it
-(241), and u-with-two-dots-over-it (252). And unicode uses the same characters as 7-bit <acronym>ASCII</acronym> for 0 through 127, and the same characters as ISO-8859-1 for 128 through 255, and then extends from there into characters
+<p>Of course, there is still the matter of all these legacy encoding systems. 7-bit <abbr>ASCII</abbr>, for instance, stores English characters as numbers ranging from 0 to 127. (65 is capital &#8220;<code>A</code>&#8221;, 97 is lowercase &#8220;<code>a</code>&#8221;, and so forth.)  English has a very simple alphabet, so it can be completely expressed in 7-bit <abbr>ASCII</abbr>. Western European languages like French, Spanish, and German all use an encoding system called ISO-8859-1 (also called &#8220;latin-1&#8221;), which uses the 7-bit <abbr>ASCII</abbr> characters for the numbers 0 through 127, but then extends into the 128-255 range for characters like n-with-a-tilde-over-it
+(241), and u-with-two-dots-over-it (252). And unicode uses the same characters as 7-bit <abbr>ASCII</abbr> for 0 through 127, and the same characters as ISO-8859-1 for 128 through 255, and then extends from there into characters
 for other languages with the remaining numbers, 256 through 65535.
 <p>When dealing with unicode data, you may at some point need to convert the data back into one of these other legacy encoding
 systems. For instance, to integrate with some other computer system which expects its data in a specific 1-byte encoding
-scheme, or to print it to a non-unicode-aware terminal or printer. Or to store it in an <acronym>XML</acronym> document which explicitly specifies the encoding scheme.
+scheme, or to print it to a non-unicode-aware terminal or printer. Or to store it in an <abbr>XML</abbr> document which explicitly specifies the encoding scheme.
 <p>And on that note, let's get back to Python.
-<p>Python has had unicode support throughout the language since version 2.0. The <acronym>XML</acronym> package uses unicode to store all parsed <acronym>XML</acronym> data, but you can use unicode anywhere.
+<p>Python has had unicode support throughout the language since version 2.0. The <abbr>XML</abbr> package uses unicode to store all parsed <abbr>XML</abbr> data, but you can use unicode anywhere.
 <div class=example><h3>Example 9.13. Introducing unicode</h3><pre class=screen>
 <samp class=prompt>>>> </samp><kbd>s = u'Dive in'</kbd>            <span>&#x2460;</span>
 <samp class=prompt>>>> </samp><kbd>s</kbd>
@@ -4194,9 +4194,9 @@ u'Dive in'
 <samp class=prompt>>>> </samp><kbd>print s</kbd> <span>&#x2461;</span>
 Dive in</pre><div class=calloutlist>
 <ol>
-<li>To create a unicode string instead of a regular <acronym>ASCII</acronym> string, add the letter &#8220;<code>u</code>&#8221; before the string. Note that this particular string doesn't have any non-<acronym>ASCII</acronym> characters. That's fine; unicode is a superset of <acronym>ASCII</acronym> (a very large superset at that), so any regular <acronym>ASCII</acronym> string can also be stored as unicode.
-<li>When printing a string, Python will attempt to convert it to your default encoding, which is usually <acronym>ASCII</acronym>. (More on this in a minute.)  Since this unicode string is made up of characters that are also <acronym>ASCII</acronym> characters, printing it has the same result as printing a normal <acronym>ASCII</acronym> string; the conversion is seamless, and if you didn't know that <var>s</var> was a unicode string, you'd never notice the difference.
-<div class=example><h3>Example 9.14. Storing non-<acronym>ASCII</acronym> characters</h3><pre class=screen>
+<li>To create a unicode string instead of a regular <abbr>ASCII</abbr> string, add the letter &#8220;<code>u</code>&#8221; before the string. Note that this particular string doesn't have any non-<abbr>ASCII</abbr> characters. That's fine; unicode is a superset of <abbr>ASCII</abbr> (a very large superset at that), so any regular <abbr>ASCII</abbr> string can also be stored as unicode.
+<li>When printing a string, Python will attempt to convert it to your default encoding, which is usually <abbr>ASCII</abbr>. (More on this in a minute.)  Since this unicode string is made up of characters that are also <abbr>ASCII</abbr> characters, printing it has the same result as printing a normal <abbr>ASCII</abbr> string; the conversion is seamless, and if you didn't know that <var>s</var> was a unicode string, you'd never notice the difference.
+<div class=example><h3>Example 9.14. Storing non-<abbr>ASCII</abbr> characters</h3><pre class=screen>
 <samp class=prompt>>>> </samp><kbd>s = u'La Pe\xf1a'</kbd>         <span>&#x2460;</span>
 <samp class=prompt>>>> </samp><kbd>print s</kbd> <span>&#x2461;</span>
 <samp class=traceback>Traceback (innermost last):
@@ -4205,11 +4205,11 @@ UnicodeError: ASCII encoding error: ordinal not in range(128)</samp>
 <samp class=prompt>>>> </samp><kbd>print s.encode('latin-1')</kbd> <span>&#x2462;</span>
 La Pe&ntilde;a</pre><div class=calloutlist>
 <ol>
-<li>The real advantage of unicode, of course, is its ability to store non-<acronym>ASCII</acronym> characters, like the Spanish &#8220;<code>&ntilde;</code>&#8221; (<code>n</code> with a tilde over it). The unicode character code for the tilde-n is <code>0xf1</code> in hexadecimal (241 in decimal), which you can type like this: <code>\xf1</code>.
-<li>Remember I said that the <code>print</code> function attempts to convert a unicode string to <acronym>ASCII</acronym> so it can print it?  Well, that's not going to work here, because your unicode string contains non-<acronym>ASCII</acronym> characters, so Python raises a <samp>UnicodeError</samp> error.
+<li>The real advantage of unicode, of course, is its ability to store non-<abbr>ASCII</abbr> characters, like the Spanish &#8220;<code>&ntilde;</code>&#8221; (<code>n</code> with a tilde over it). The unicode character code for the tilde-n is <code>0xf1</code> in hexadecimal (241 in decimal), which you can type like this: <code>\xf1</code>.
+<li>Remember I said that the <code>print</code> statement attempts to convert a unicode string to <abbr>ASCII</abbr> so it can print it?  Well, that's not going to work here, because your unicode string contains non-<abbr>ASCII</abbr> characters, so Python raises a <samp>UnicodeError</samp>.
 <li>Here's where the conversion-from-unicode-to-other-encoding-schemes comes in. <var>s</var> is a unicode string, but <code>print</code> can only print a regular string. To solve this problem, you call the <code>encode</code> method, available on every unicode string, to convert the unicode string to a regular string in the given encoding scheme,
-            which you pass as a parameter. In this case, you're using <code>latin-1</code> (also known as <code>iso-8859-1</code>), which includes the tilde-n (whereas the default <acronym>ASCII</acronym> encoding scheme did not, since it only includes characters numbered 0 through 127).
-<p>Remember I said Python usually converted unicode to <acronym>ASCII</acronym> whenever it needed to make a regular string out of a unicode string?  Well, this default encoding scheme is an option which
+            which you pass as a parameter. In this case, you're using <code>latin-1</code> (also known as <code>iso-8859-1</code>), which includes the tilde-n (whereas the default <abbr>ASCII</abbr> encoding scheme did not, since it only includes characters numbered 0 through 127).
+<p>Remember I said Python usually converted unicode to <abbr>ASCII</abbr> whenever it needed to make a regular string out of a unicode string?  Well, this default encoding scheme is an option which
 you can customize.
 <div class=example><h3>Example 9.15. <code>sitecustomize.py</code></h3><pre><code>
 # sitecustomize.py <span>&#x2460;</span>
@@ -4237,15 +4237,15 @@ La Pe&ntilde;a</pre><div class=calloutlist>
 <p>If you are going to be storing non-ASCII strings within your Python code, you'll need to specify the encoding of each individual <code>.py</code> file by putting an encoding declaration at the top of each file. This declaration defines the <code>.py</code> file to be UTF-8:<pre><code>
 #!/usr/bin/env python
 # -*- coding: UTF-8 -*-
-</pre><p>Now, what about <acronym>XML</acronym>?  Well, every <acronym>XML</acronym> document is in a specific encoding. Again, ISO-8859-1 is a popular encoding for data in Western European languages. KOI8-R
-is popular for Russian texts. The encoding, if specified, is in the header of the <acronym>XML</acronym> document.
+</pre><p>Now, what about <abbr>XML</abbr>?  Well, every <abbr>XML</abbr> document is in a specific encoding. Again, ISO-8859-1 is a popular encoding for data in Western European languages. KOI8-R
+is popular for Russian texts. The encoding, if specified, is in the header of the <abbr>XML</abbr> document.
 <div class=example><h3>Example 9.18. <code>russiansample.xml</code></h3><pre class=screen><samp>
 &lt;?xml version="1.0" encoding="koi8-r"?>       </span><span>&#x2460;</span><samp>
 &lt;preface>
 &lt;title>&#1055;&#1088;&#1077;&#1076;&#1080;&#1089;&#1083;&#1086;&#1074;&#1080;&#1077;&lt;/title>  </span><span>&#x2461;</span><samp>
 &lt;/preface></span></pre><div class=calloutlist>
 <ol>
-<li>This is a sample extract from a real Russian <acronym>XML</acronym> document; it's part of a Russian translation of this very book. Note the encoding, <code>koi8-r</code>, specified in the header.
+<li>This is a sample extract from a real Russian <abbr>XML</abbr> document; it's part of a Russian translation of this very book. Note the encoding, <code>koi8-r</code>, specified in the header.
 <li>These are Cyrillic characters which, as far as I know, spell the Russian word for &#8220;Preface&#8221;. If you open this file in a regular text editor, the characters will most likely like gibberish, because they're encoded
             using the <code>koi8-r</code> encoding scheme, but they're being displayed in <code>iso-8859-1</code>.
 <div class=example><h3>Example 9.19. Parsing <code>russiansample.xml</code></h3><pre class=screen>
@@ -4267,26 +4267,26 @@ UnicodeError: ASCII encoding error: ordinal not in range(128)</samp>
 <li>I'm assuming here that you saved the previous example as <code>russiansample.xml</code> in the current directory. I am also, for the sake of completeness, assuming that you've changed your default encoding back
             to <code>'ascii'</code> by removing your <code>sitecustomize.py</code> file, or at least commenting out the <code>setdefaultencoding</code> line.
 <li>Note that the text data of the <code>title</code> tag (now in the <var>title</var> variable, thanks to that long concatenation of Python functions which I hastily skipped over and, annoyingly, won't explain until the next section) -- the text data inside the
-<acronym>XML</acronym> document's <code>title</code> element is stored in unicode.
-<li>Printing the title is not possible, because this unicode string contains non-<acronym>ASCII</acronym> characters, so Python can't convert it to <acronym>ASCII</acronym> because that doesn't make sense.
+<abbr>XML</abbr> document's <code>title</code> element is stored in unicode.
+<li>Printing the title is not possible, because this unicode string contains non-<abbr>ASCII</abbr> characters, so Python can't convert it to <abbr>ASCII</abbr> because that doesn't make sense.
 <li>You can, however, explicitly convert it to <code>koi8-r</code>, in which case you get a (regular, not unicode) string of single-byte characters (<code>f0</code>, <code>d2</code>, <code>c5</code>, and so forth) that are the <code>koi8-r</code>-encoded versions of the characters in the original unicode string.
-<li>Printing the <code>koi8-r</code>-encoded string will probably show gibberish on your screen, because your Python <acronym>IDE</acronym> is interpreting those characters as <code>iso-8859-1</code>, not <code>koi8-r</code>. But at least they do print. (And, if you look carefully, it's the same gibberish that you saw when you opened the original
-<acronym>XML</acronym> document in a non-unicode-aware text editor. Python converted it from <code>koi8-r</code> into unicode when it parsed the <acronym>XML</acronym> document, and you've just converted it back.)
+<li>Printing the <code>koi8-r</code>-encoded string will probably show gibberish on your screen, because your Python <abbr>IDE</abbr> is interpreting those characters as <code>iso-8859-1</code>, not <code>koi8-r</code>. But at least they do print. (And, if you look carefully, it's the same gibberish that you saw when you opened the original
+<abbr>XML</abbr> document in a non-unicode-aware text editor. Python converted it from <code>koi8-r</code> into unicode when it parsed the <abbr>XML</abbr> document, and you've just converted it back.)
 <p>To sum up, unicode itself is a bit intimidating if you've never seen it before, but unicode data is really very easy to handle
-in Python. If your <acronym>XML</acronym> documents are all 7-bit <acronym>ASCII</acronym> (like the examples in this chapter), you will literally never think about unicode. Python will convert the <acronym>ASCII</acronym> data in the <acronym>XML</acronym> documents into unicode while parsing, and auto-coerce it back to <acronym>ASCII</acronym> whenever necessary, and you'll never even notice. But if you need to deal with that in other languages, Python is ready.
+in Python. If your <abbr>XML</abbr> documents are all 7-bit <abbr>ASCII</abbr> (like the examples in this chapter), you will literally never think about unicode. Python will convert the <abbr>ASCII</abbr> data in the <abbr>XML</abbr> documents into unicode while parsing, and auto-coerce it back to <abbr>ASCII</abbr> whenever necessary, and you'll never even notice. But if you need to deal with data in other languages, Python is ready.
 <div class=itemizedlist>
 <h3>Further reading</h3>
 <ul>
 <li><a href="http://www.unicode.org/">Unicode.org</a> is the home page of the unicode standard, including a brief <a href="http://www.unicode.org/standard/principles.html">technical introduction</a>.
 
-<li><a href="http://www.reportlab.com/i18n/python_unicode_tutorial.html">Unicode Tutorial</a> has some more examples of how to use Python's unicode functions, including how to force Python to coerce unicode into <acronym>ASCII</acronym> even when it doesn't really want to.
+<li><a href="http://www.reportlab.com/i18n/python_unicode_tutorial.html">Unicode Tutorial</a> has some more examples of how to use Python's unicode functions, including how to force Python to coerce unicode into <abbr>ASCII</abbr> even when it doesn't really want to.
 
 <li><a href="http://www.python.org/peps/pep-0263.html">PEP 263</a> goes into more detail about how and when to define a character encoding in your <code>.py</code> files.
 
 </ul>
 <h2 id="kgp.search">9.5. Searching for elements</h2>
-<p>Traversing <acronym>XML</acronym> documents by stepping through each node can be tedious. If you're looking for something in particular, buried deep within
-   your <acronym>XML</acronym> document, there is a shortcut you can use to find it quickly: <code>getElementsByTagName</code>.
+<p>Traversing <abbr>XML</abbr> documents by stepping through each node can be tedious. If you're looking for something in particular, buried deep within
+   your <abbr>XML</abbr> document, there is a shortcut you can use to find it quickly: <code>getElementsByTagName</code>.
 <p>For this section, you'll be using the <code>binary.xml</code> grammar file, which looks like this:
 <div class=example><h3>Example 9.20. <code>binary.xml</code></h3><pre class=screen><samp>&lt;?xml version="1.0"?>
 &lt;!DOCTYPE grammar PUBLIC "-//diveintopython3.org//DTD Kant Generator Pro v1.0//EN" "kgp.dtd">
@@ -4318,7 +4318,7 @@ in Python. If your <acronym>XML</acronym> documents are all 7-bit <acronym>ASCII
 &lt;/ref>
 </span></pre><div class=calloutlist>
 <ol>
-<li><code>getElementsByTagName</code> takes one argument, the name of the element you wish to find. It returns a list of <code>Element</code> objects, corresponding to the <acronym>XML</acronym> elements that have that name. In this case, you find two <code>ref</code> elements.
+<li><code>getElementsByTagName</code> takes one argument, the name of the element you wish to find. It returns a list of <code>Element</code> objects, corresponding to the <abbr>XML</abbr> elements that have that name. In this case, you find two <code>ref</code> elements.
 <div class=example><h3>Example 9.22. Every element is searchable</h3><pre class=screen>
 <samp class=prompt>>>> </samp><kbd>firstref = reflist[0]</kbd>    <span>&#x2460;</span>
 <samp class=prompt>>>> </samp><kbd>print firstref.toxml()</kbd>
@@ -4349,15 +4349,15 @@ in Python. If your <acronym>XML</acronym> documents are all 7-bit <acronym>ASCII
 <samp>'&lt;p>&lt;xref id="bit"/>&lt;xref id="bit"/>&lt;xref id="bit"/>&lt;xref id="bit"/>\
 &lt;xref id="bit"/>&lt;xref id="bit"/>&lt;xref id="bit"/>&lt;xref id="bit"/>&lt;/p>'</span></pre><div class=calloutlist>
 <ol>
-<li>Note carefully the difference between this and the previous example. Previously, you were searching for <code>p</code> elements within <var>firstref</var>, but here you are searching for <code>p</code> elements within <var>xmldoc</var>, the root-level object that represents the entire <acronym>XML</acronym> document. This <em>does</em> find the <code>p</code> elements nested within the <code>ref</code> elements within the root <code>grammar</code> element.
+<li>Note carefully the difference between this and the previous example. Previously, you were searching for <code>p</code> elements within <var>firstref</var>, but here you are searching for <code>p</code> elements within <var>xmldoc</var>, the root-level object that represents the entire <abbr>XML</abbr> document. This <em>does</em> find the <code>p</code> elements nested within the <code>ref</code> elements within the root <code>grammar</code> element.
 <li>The first two <code>p</code> elements are within the first <code>ref</code> (the <code>'bit'</code> <code>ref</code>).
 <li>The last <code>p</code> element is the one within the second <code>ref</code> (the <code>'byte'</code> <code>ref</code>).
 <h2 id="kgp.attributes">9.6. Accessing element attributes</h2>
-<p><acronym>XML</acronym> elements can have one or more attributes, and it is incredibly simple to access them once you have parsed an <acronym>XML</acronym> document.
+<p><abbr>XML</abbr> elements can have one or more attributes, and it is incredibly simple to access them once you have parsed an <abbr>XML</abbr> document.
 <p>For this section, you'll be using the <code>binary.xml</code> grammar file that you saw in the <a href="#kgp.search" title="9.5. Searching for elements">previous section</a>.
 <table class=note border="0" summary="">
 
-<td rowspan="2" align="center" valign="top" width="1%"><img src="images/note.png" alt="Note" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">This section may be a little confusing, because of some overlapping terminology. Elements in an <acronym>XML</acronym> document have attributes, and Python objects also have attributes. When you parse an <acronym>XML</acronym> document, you get a bunch of Python objects that represent all the pieces of the <acronym>XML</acronym> document, and some of these Python objects represent attributes of the <acronym>XML</acronym> elements. But the (Python) objects that represent the (<acronym>XML</acronym>) attributes also have (Python) attributes, which are used to access various parts of the (<acronym>XML</acronym>) attribute that the object represents. I told you it was confusing. I am open to suggestions on how to distinguish these
+<td rowspan="2" align="center" valign="top" width="1%"><img src="images/note.png" alt="Note" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">This section may be a little confusing, because of some overlapping terminology. Elements in an <abbr>XML</abbr> document have attributes, and Python objects also have attributes. When you parse an <abbr>XML</abbr> document, you get a bunch of Python objects that represent all the pieces of the <abbr>XML</abbr> document, and some of these Python objects represent attributes of the <abbr>XML</abbr> elements. But the (Python) objects that represent the (<abbr>XML</abbr>) attributes also have (Python) attributes, which are used to access various parts of the (<abbr>XML</abbr>) attribute that the object represents. I told you it was confusing. I am open to suggestions on how to distinguish these
       more clearly.
 <div class=example><h3>Example 9.24. Accessing element attributes</h3><pre class=screen>
 <samp class=prompt>>>> </samp><kbd>xmldoc = minidom.parse('binary.xml')</kbd>
@@ -4379,7 +4379,7 @@ in Python. If your <acronym>XML</acronym> documents are all 7-bit <acronym>ASCII
 <ol>
 <li>Each <code>Element</code> object has an attribute called <code>attributes</code>, which is a <code>NamedNodeMap</code> object. This sounds scary, but it's not, because a <code>NamedNodeMap</code> is an object that <a href="#fileinfo.userdict" title="5.5. Exploring UserDict: A Wrapper Class">acts like a dictionary</a>, so you already know how to use it.
 <li>Treating the <code>NamedNodeMap</code> as a dictionary, you can get a list of the names of the attributes of this element by using <code>attributes.keys()</code>. This element has only one attribute, <code>'id'</code>.
-<li>Attribute names, like all other text in an <acronym>XML</acronym> document, are stored in <a href="#kgp.unicode" title="9.4. Unicode">unicode</a>.
+<li>Attribute names, like all other text in an <abbr>XML</abbr> document, are stored in <a href="#kgp.unicode" title="9.4. Unicode">unicode</a>.
 <li>Again treating the <code>NamedNodeMap</code> as a dictionary, you can get a list of the values of the attributes by using <code>attributes.values()</code>. The values are themselves objects, of type <code>Attr</code>. You'll see how to get useful information out of this object in the next example.
 <li>Still treating the <code>NamedNodeMap</code> as a dictionary, you can access an individual attribute by name, using normal dictionary syntax. (Readers who have been
             paying extra-close attention will already know how the <code>NamedNodeMap</code> class accomplishes this neat trick: by defining a <a href="#fileinfo.specialmethods" title="5.6. Special Class Methods"><code>__getitem__</code> special method</a>. Other readers can take comfort in the fact that they don't need to understand how it works in order to use it effectively.)
@@ -4392,11 +4392,11 @@ u'id'
 <samp class=prompt>>>> </samp><kbd>a.value</kbd> <span>&#x2461;</span>
 u'bit'</pre><div class=calloutlist>
 <ol>
-<li>The <code>Attr</code> object completely represents a single <acronym>XML</acronym> attribute of a single <acronym>XML</acronym> element. The name of the attribute (the same name as you used to find this object in the <code>bitref.attributes</code> <code>NamedNodeMap</code> pseudo-dictionary) is stored in <code>a.name</code>.
-<li>The actual text value of this <acronym>XML</acronym> attribute is stored in <code>a.value</code>.
+<li>The <code>Attr</code> object completely represents a single <abbr>XML</abbr> attribute of a single <abbr>XML</abbr> element. The name of the attribute (the same name as you used to find this object in the <code>bitref.attributes</code> <code>NamedNodeMap</code> pseudo-dictionary) is stored in <code>a.name</code>.
+<li>The actual text value of this <abbr>XML</abbr> attribute is stored in <code>a.value</code>.
 <table class=note border="0" summary="">
 
-<td rowspan="2" align="center" valign="top" width="1%"><img src="images/note.png" alt="Note" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">Like a dictionary, attributes of an <acronym>XML</acronym> element have no ordering. Attributes may <em>happen to be</em> listed in a certain order in the original <acronym>XML</acronym> document, and the <code>Attr</code> objects may <em>happen to be</em> listed in a certain order when the <acronym>XML</acronym> document is parsed into Python objects, but these orders are arbitrary and should carry no special meaning. You should always access individual attributes
+<td rowspan="2" align="center" valign="top" width="1%"><img src="images/note.png" alt="Note" title="" width="24" height="24"><td colspan="2" align="left" valign="top" width="99%">Like a dictionary, attributes of an <abbr>XML</abbr> element have no ordering. Attributes may <em>happen to be</em> listed in a certain order in the original <abbr>XML</abbr> document, and the <code>Attr</code> objects may <em>happen to be</em> listed in a certain order when the <abbr>XML</abbr> document is parsed into Python objects, but these orders are arbitrary and should carry no special meaning. You should always access individual attributes
       by name, like the keys of a dictionary.
 <h2 id="kgp.segue">9.7. Segue</h2>
 <p>OK, that's it for the hard-core XML stuff. The next chapter will continue to use these same example programs, but focus on
@@ -4404,7 +4404,7 @@ u'bit'</pre><div class=calloutlist>
 <p>Before moving on to the next chapter, you should be comfortable doing all of these things:
 <div class=itemizedlist>
 <ul>
-<li><a href="#kgp.parse" title="9.3. Parsing XML">Parsing <acronym>XML</acronym> documents</a> using <code>minidom</code>, <a href="#kgp.search" title="9.5. Searching for elements">searching through the parsed document</a>, and accessing arbitrary <a href="#kgp.attributes" title="9.6. Accessing element attributes">element attributes</a> and <a href="#kgp.child" title="10.4. Finding direct children of a node">element children</a>
+<li><a href="#kgp.parse" title="9.3. Parsing XML">Parsing <abbr>XML</abbr> documents</a> using <code>minidom</code>, <a href="#kgp.search" title="9.5. Searching for elements">searching through the parsed document</a>, and accessing arbitrary <a href="#kgp.attributes" title="9.6. Accessing element attributes">element attributes</a> and <a href="#kgp.child" title="10.4. Finding direct children of a node">element children</a>
 <li>Organizing complex libraries into <a href="#kgp.packages" title="9.2. Packages">packages</a>
 <li><a href="#kgp.unicode" title="9.4. Unicode">Converting unicode strings</a> to different character encodings
 
@@ -4426,8 +4426,8 @@ off and returns the next chunk of data.
 <p>This is how <a href="#fileinfo.files" title="6.2. Working with File Objects">reading from real files</a> works; the difference is that you're not limiting yourself to real files. The input source could be anything: a file on
 disk, a web page, even a hard-coded string. As long as you pass a file-like object to the function, and the function simply
 calls the object's <code>read</code> method, the function can handle any kind of input source without specific code to handle each kind.
-<p>In case you were wondering how this relates to <acronym>XML</acronym> processing, <code>minidom.parse</code> is one such function which can take a file-like object.
-<div class=example><h3>Example 10.1. Parsing <acronym>XML</acronym> from a file</h3><pre class=screen>
+<p>In case you were wondering how this relates to <abbr>XML</abbr> processing, <code>minidom.parse</code> is one such function which can take a file-like object.
+<div class=example><h3>Example 10.1. Parsing <abbr>XML</abbr> from a file</h3><pre class=screen>
 <samp class=prompt>>>> </samp><kbd>from xml.dom import minidom</kbd>
 <samp class=prompt>>>> </samp><kbd>fsock = open('binary.xml')</kbd>    <span>&#x2460;</span>
 <samp class=prompt>>>> </samp><kbd>xmldoc = minidom.parse(fsock)</kbd> <span>&#x2461;</span>
@@ -4446,12 +4446,12 @@ calls the object's <code>read</code> method, the function can handle any kind of
 &lt;/grammar></span></pre><div class=calloutlist>
 <ol>
 <li>First, you open the file on disk. This gives you a <a href="#fileinfo.files" title="6.2. Working with File Objects">file object</a>.
-<li>You pass the file object to <code>minidom.parse</code>, which calls the <code>read</code> method of <var>fsock</var> and reads the <acronym>XML</acronym> document from the file on disk.
+<li>You pass the file object to <code>minidom.parse</code>, which calls the <code>read</code> method of <var>fsock</var> and reads the <abbr>XML</abbr> document from the file on disk.
 <li>Be sure to call the <code>close</code> method of the file object after you're done with it. <code>minidom.parse</code> will not do this for you.
-<li>Calling the <code>toxml()</code> method on the returned <acronym>XML</acronym> document prints out the entire thing.
+<li>Calling the <code>toxml()</code> method on the returned <abbr>XML</abbr> document prints out the entire thing.
 <p>Well, that all seems like a colossal waste of time. After all, you've already seen that <code>minidom.parse</code> can simply take the filename and do all the opening and closing nonsense automatically. And it's true that if you know you're
-just going to be parsing a local file, you can pass the filename and <code>minidom.parse</code> is smart enough to Do The Right Thing&#8482;. But notice how similar -- and easy -- it is to parse an <acronym>XML</acronym> document straight from the Internet.
-<div class=example><h3 id="kgp.openanything.urllib">Example 10.2. Parsing <acronym>XML</acronym> from a <acronym>URL</acronym></h3><pre class=screen>
+just going to be parsing a local file, you can pass the filename and <code>minidom.parse</code> is smart enough to Do The Right Thing&#8482;. But notice how similar -- and easy -- it is to parse an <abbr>XML</abbr> document straight from the Internet.
+<div class=example><h3 id="kgp.openanything.urllib">Example 10.2. Parsing <abbr>XML</abbr> from a <abbr>URL</abbr></h3><pre class=screen>
 <samp class=prompt>>>> </samp><kbd>import urllib</kbd>
 <samp class=prompt>>>> </samp><kbd>usock = urllib.urlopen('http://slashdot.org/slashdot.rdf')</kbd> <span>&#x2460;</span>
 <samp class=prompt>>>> </samp><kbd>xmldoc = minidom.parse(usock)</kbd>            <span>&#x2461;</span>
@@ -4480,20 +4480,20 @@ just going to be parsing a local file, you can pass the filename and <code>minid
 
 [...snip...]</span></pre><div class=calloutlist>
 <ol>
-<li>As you saw <a href="#dialect.extract.urllib" title="Example 8.5. Introducing urllib">in a previous chapter</a>, <code>urlopen</code> takes a web page <acronym>URL</acronym> and returns a file-like object. Most importantly, this object has a <code>read</code> method which returns the <acronym>HTML</acronym> source of the web page.
-<li>Now you pass the file-like object to <code>minidom.parse</code>, which obediently calls the <code>read</code> method of the object and parses the <acronym>XML</acronym> data that the <code>read</code> method returns. The fact that this <acronym>XML</acronym> data is now coming straight from a web page is completely irrelevant. <code>minidom.parse</code> doesn't know about web pages, and it doesn't care about web pages; it just knows about file-like objects.
+<li>As you saw <a href="#dialect.extract.urllib" title="Example 8.5. Introducing urllib">in a previous chapter</a>, <code>urlopen</code> takes a web page <abbr>URL</abbr> and returns a file-like object. Most importantly, this object has a <code>read</code> method which returns the <abbr>HTML</abbr> source of the web page.
+<li>Now you pass the file-like object to <code>minidom.parse</code>, which obediently calls the <code>read</code> method of the object and parses the <abbr>XML</abbr> data that the <code>read</code> method returns. The fact that this <abbr>XML</abbr> data is now coming straight from a web page is completely irrelevant. <code>minidom.parse</code> doesn't know about web pages, and it doesn't care about web pages; it just knows about file-like objects.
 <li>As soon as you're done with it, be sure to close the file-like object that <code>urlopen</code> gives you.
-<li>By the way, this <acronym>URL</acronym> is real, and it really is <acronym>XML</acronym>. It's an <acronym>XML</acronym> representation of the current headlines on <a href="http://slashdot.org/">Slashdot</a>, a technical news and gossip site.
-<div class=example><h3>Example 10.3. Parsing <acronym>XML</acronym> from a string (the easy but inflexible way)</h3><pre class=screen>
+<li>By the way, this <abbr>URL</abbr> is real, and it really is <abbr>XML</abbr>. It's an <abbr>XML</abbr> representation of the current headlines on <a href="http://slashdot.org/">Slashdot</a>, a technical news and gossip site.
+<div class=example><h3>Example 10.3. Parsing <abbr>XML</abbr> from a string (the easy but inflexible way)</h3><pre class=screen>
 <samp class=prompt>>>> </samp><kbd>contents = "&lt;grammar>&lt;ref id='bit'>&lt;p>0&lt;/p>&lt;p>1&lt;/p>&lt;/ref>&lt;/grammar>"</kbd>
 <samp class=prompt>>>> </samp><kbd>xmldoc = minidom.parseString(contents)</kbd> <span>&#x2460;</span>
 <samp class=prompt>>>> </samp><kbd>print xmldoc.toxml()</kbd>
 <samp>&lt;?xml version="1.0" ?>
 &lt;grammar>&lt;ref id="bit">&lt;p>0&lt;/p>&lt;p>1&lt;/p>&lt;/ref>&lt;/grammar></span></pre><div class=calloutlist>
 <ol>
-<li><code>minidom</code> has a method, <code>parseString</code>, which takes an entire <acronym>XML</acronym> document as a string and parses it. You can use this instead of <code>minidom.parse</code> if you know you already have your entire <acronym>XML</acronym> document in a string.
-<p>OK, so you can use the <code>minidom.parse</code> function for parsing both local files and remote <acronym>URL</acronym>s, but for parsing strings, you use... a different function. That means that if you want to be able to take input from a
-file, a <acronym>URL</acronym>, or a string, you'll need special logic to check whether it's a string, and call the <code>parseString</code> function instead. How unsatisfying.
+<li><code>minidom</code> has a function, <code>parseString</code>, which takes an entire <abbr>XML</abbr> document as a string and parses it. You can use this instead of <code>minidom.parse</code> if you know you already have your entire <abbr>XML</abbr> document in a string.
+<p>OK, so you can use the <code>minidom.parse</code> function for parsing both local files and remote <abbr>URL</abbr>s, but for parsing strings, you use... a different function. That means that if you want to be able to take input from a
+file, a <abbr>URL</abbr>, or a string, you'll need special logic to check whether it's a string, and call the <code>parseString</code> function instead. How unsatisfying.
 <p>If there were a way to turn a string into a file-like object, then you could simply pass this object to <code>minidom.parse</code>. And in fact, there is a module specifically designed for doing just that: <code>StringIO</code>.
 <div class=example><h3 id="kgp.openanything.stringio.example">Example 10.4. Introducing <code>StringIO</code></h3><pre class=screen>
 <samp class=prompt>>>> </samp><kbd>contents = "&lt;grammar>&lt;ref id='bit'>&lt;p>0&lt;/p>&lt;p>1&lt;/p>&lt;/ref>&lt;/grammar>"</kbd>
@@ -4520,7 +4520,7 @@ file, a <acronym>URL</acronym>, or a string, you'll need special logic to check
 <li>You can also read the string in chunks, by passing a <var>size</var> parameter to the <code>read</code> method.
 <li>At any time, <code>read</code> will return the rest of the string that you haven't read yet. All of this is exactly how file objects work; hence the term
 <em>file-like object</em>.
-<div class=example><h3>Example 10.5. Parsing <acronym>XML</acronym> from a string (the file-like object way)</h3><pre class=screen>
+<div class=example><h3>Example 10.5. Parsing <abbr>XML</abbr> from a string (the file-like object way)</h3><pre class=screen>
 <samp class=prompt>>>> </samp><kbd>contents = "&lt;grammar>&lt;ref id='bit'>&lt;p>0&lt;/p>&lt;p>1&lt;/p>&lt;/ref>&lt;/grammar>"</kbd>
 <samp class=prompt>>>> </samp><kbd>ssock = StringIO.StringIO(contents)</kbd>
 <samp class=prompt>>>> </samp><kbd>xmldoc = minidom.parse(ssock)</kbd> <span>&#x2460;</span>
@@ -4530,7 +4530,7 @@ file, a <acronym>URL</acronym>, or a string, you'll need special logic to check
 &lt;grammar>&lt;ref id="bit">&lt;p>0&lt;/p>&lt;p>1&lt;/p>&lt;/ref>&lt;/grammar></span></pre><div class=calloutlist>
 <ol>
 <li>Now you can pass the file-like object (really a <code>StringIO</code>) to <code>minidom.parse</code>, which will call the object's <code>read</code> method and happily parse away, never knowing that its input came from a hard-coded string.
-<p>So now you know how to use a single function, <code>minidom.parse</code>, to parse an <acronym>XML</acronym> document stored on a web page, in a local file, or in a hard-coded string. For a web page, you use <code>urlopen</code> to get a file-like object; for a local file, you use <code>open</code>; and for a string, you use <code>StringIO</code>. Now let's take it one step further and generalize <em>these</em> differences as well.
+<p>So now you know how to use a single function, <code>minidom.parse</code>, to parse an <abbr>XML</abbr> document stored on a web page, in a local file, or in a hard-coded string. For a web page, you use <code>urlopen</code> to get a file-like object; for a local file, you use <code>open</code>; and for a string, you use <code>StringIO</code>. Now let's take it one step further and generalize <em>these</em> differences as well.
 <div class=example><h3 id="kgp.openanything.example">Example 10.6. <code>openAnything</code></h3><pre><code>
 def openAnything(source):<span>&#x2460;</span>
     # try to open with urllib (if source is http, ftp, or file URL)
@@ -4550,12 +4550,12 @@ def openAnything(source):<span>&#x2460;</span>
     import StringIO     
     return StringIO.StringIO(str(source))  <span>&#x2463;</span></pre><div class=calloutlist>
 <ol>
-<li>The <code>openAnything</code> function takes a single parameter, <var>source</var>, and returns a file-like object. <var>source</var> is a string of some sort; it can either be a <acronym>URL</acronym> (like <code>'http://slashdot.org/slashdot.rdf'</code>), a full or partial pathname to a local file (like <code>'binary.xml'</code>), or a string that contains actual <acronym>XML</acronym> data to be parsed.
-<li>First, you see if <var>source</var> is a <acronym>URL</acronym>. You do this through brute force: you try to open it as a <acronym>URL</acronym> and silently ignore errors caused by trying to open something which is not a <acronym>URL</acronym>. This is actually elegant in the sense that, if <code>urllib</code> ever supports new types of <acronym>URL</acronym>s in the future, you will also support them without recoding. If <code>urllib</code> is able to open <var>source</var>, then the <code>return</code> kicks you out of the function immediately and the following <code>try</code> statements never execute.
-<li>On the other hand, if <code>urllib</code> yelled at you and told you that <var>source</var> wasn't a valid <acronym>URL</acronym>, you assume it's a path to a file on disk and try to open it. Again, you don't do anything fancy to check whether <var>source</var> is a valid filename or not (the rules for valid filenames vary wildly between different platforms anyway, so you'd probably
+<li>The <code>openAnything</code> function takes a single parameter, <var>source</var>, and returns a file-like object. <var>source</var> is a string of some sort; it can either be a <abbr>URL</abbr> (like <code>'http://slashdot.org/slashdot.rdf'</code>), a full or partial pathname to a local file (like <code>'binary.xml'</code>), or a string that contains actual <abbr>XML</abbr> data to be parsed.
+<li>First, you see if <var>source</var> is a <abbr>URL</abbr>. You do this through brute force: you try to open it as a <abbr>URL</abbr> and silently ignore errors caused by trying to open something which is not a <abbr>URL</abbr>. This is actually elegant in the sense that, if <code>urllib</code> ever supports new types of <abbr>URL</abbr>s in the future, you will also support them without recoding. If <code>urllib</code> is able to open <var>source</var>, then the <code>return</code> kicks you out of the function immediately and the following <code>try</code> statements never execute.
+<li>On the other hand, if <code>urllib</code> yelled at you and told you that <var>source</var> wasn't a valid <abbr>URL</abbr>, you assume it's a path to a file on disk and try to open it. Again, you don't do anything fancy to check whether <var>source</var> is a valid filename or not (the rules for valid filenames vary wildly between different platforms, so you'd probably
             get them wrong anyway). Instead, you just blindly open the file, and silently trap any errors.
 <li>By this point, you need to assume that <var>source</var> is a string that has hard-coded data in it (since nothing else worked), so you use <code>StringIO</code> to create a file-like object out of it and return that. (In fact, since you're using the <code>str</code> function, <var>source</var> doesn't even need to be a string; it could be any object, and you'll use its string representation, as defined by its <code>__str__</code> <a href="#fileinfo.morespecial" title="5.7. Advanced Special Class Methods">special method</a>.)
-<p>Now you can use this <code>openAnything</code> function in conjunction with <code>minidom.parse</code> to make a function that takes a <var>source</var> that refers to an <acronym>XML</acronym> document somehow (either as a <acronym>URL</acronym>, or a local filename, or a hard-coded <acronym>XML</acronym> document in a string) and parses it.
+<p>Now you can use this <code>openAnything</code> function in conjunction with <code>minidom.parse</code> to make a function that takes a <var>source</var> that refers to an <abbr>XML</abbr> document somehow (either as a <abbr>URL</abbr>, or a local filename, or a hard-coded <abbr>XML</abbr> document in a string) and parses it.
 <div class=example><h3>Example 10.7. Using <code>openAnything</code> in <code>kgp.py</code></h3><pre><code>
 class KantGenerator:
     def _load(self, source):
@@ -4563,11 +4563,11 @@ class KantGenerator:
         xmldoc = minidom.parse(sock).documentElement
         sock.close()
         return xmldoc</pre><h2 id="kgp.stdio">10.2. Standard input, output, and error</h2>
-<p><acronym>UNIX</acronym> users are already familiar with the concept of standard input, standard output, and standard error. This section is for
+<p><abbr>UNIX</abbr> users are already familiar with the concept of standard input, standard output, and standard error. This section is for
    the rest of you.
-<p>Standard output and standard error (commonly abbreviated <code>stdout</code> and <code>stderr</code>) are pipes that are built into every <acronym>UNIX</acronym> system. When you <code>print</code> something, it goes to the <code>stdout</code> pipe; when your program crashes and prints out debugging information (like a traceback in Python), it goes to the <code>stderr</code> pipe. Both of these pipes are ordinarily just connected to the terminal window where you are working, so when a program
+<p>Standard output and standard error (commonly abbreviated <code>stdout</code> and <code>stderr</code>) are pipes that are built into every <abbr>UNIX</abbr> system. When you <code>print</code> something, it goes to the <code>stdout</code> pipe; when your program crashes and prints out debugging information (like a traceback in Python), it goes to the <code>stderr</code> pipe. Both of these pipes are ordinarily just connected to the terminal window where you are working, so when a program
 prints, you see the output, and when a program crashes, you see the debugging information. (If you're working on a system
-with a window-based Python <acronym>IDE</acronym>, <code>stdout</code> and <code>stderr</code> default to your &#8220;Interactive Window&#8221;.)
+with a window-based Python <abbr>IDE</abbr>, <code>stdout</code> and <code>stderr</code> default to your &#8220;Interactive Window&#8221;.)
 <div class=example><h3>Example 10.8. Introducing <code>stdout</code> and <code>stderr</code></h3><pre class=screen>
 <samp class=prompt>>>> </samp><kbd>for i in range(3):</kbd>
 <samp class=prompt>...    </samp>print 'Dive in'             <span>&#x2460;</span>
@@ -4584,7 +4584,7 @@ Dive inDive inDive in</pre><div class=calloutlist>
 <ol>
 <li>As you saw in <a href="#fileinfo.for.counter" title="Example 6.9. Simple Counters">Example 6.9, &#8220;Simple Counters&#8221;</a>, you can use Python's built-in <code>range</code> function to build simple counter loops that repeat something a set number of times.
 <li><code>stdout</code> is a file-like object; calling its <code>write</code> function will print out whatever string you give it. In fact, this is what the <code>print</code> function really does; it adds a carriage return to the end of the string you're printing, and calls <code>sys.stdout.write</code>.
-<li>In the simplest case, <code>stdout</code> and <code>stderr</code> send their output to the same place: the Python <acronym>IDE</acronym> (if you're in one), or the terminal (if you're running Python from the command line). Like <code>stdout</code>, <code>stderr</code> does not add carriage returns for you; if you want them, add them yourself.
+<li>In the simplest case, <code>stdout</code> and <code>stderr</code> send their output to the same place: the Python <abbr>IDE</abbr> (if you're in one), or the terminal (if you're running Python from the command line). Like <code>stdout</code>, <code>stderr</code> does not add carriage returns for you; if you want them, add them yourself.
 <p><code>stdout</code> and <code>stderr</code> are both file-like objects, like the ones you discussed in <a href="#kgp.openanything" title="10.1. Abstracting input sources">Section 10.1, &#8220;Abstracting input sources&#8221;</a>, but they are both write-only. They have no <code>read</code> method, only <code>write</code>. Still, they are file-like objects, and you can assign any other file- or file-like object to them to redirect their output.
 <div class=example><h3>Example 10.9. Redirecting output</h3><pre class=screen>
 <samp class=prompt>[you@localhost kgp]$ </samp>python stdout.py
@@ -4605,11 +4605,11 @@ sys.stdout = saveout <span>&#x2465;</span>
 fsock.close()        <span>&#x2466;</span>
 </pre><div class=calloutlist>
 <ol>
-<li>This will print to the <acronym>IDE</acronym> &#8220;Interactive Window&#8221; (or the terminal, if running the script from the command line).
+<li>This will print to the <abbr>IDE</abbr> &#8220;Interactive Window&#8221; (or the terminal, if running the script from the command line).
 <li>Always save <code>stdout</code> before redirecting it, so you can set it back to normal later.
 <li>Open a file for writing. If the file doesn't exist, it will be created. If the file does exist, it will be overwritten.
 <li>Redirect all further output to the new file you just opened.
-<li>This will be &#8220;printed&#8221; to the log file only; it will not be visible in the <acronym>IDE</acronym> window or on the screen.
+<li>This will be &#8220;printed&#8221; to the log file only; it will not be visible in the <abbr>IDE</abbr> window or on the screen.
 <li>Set <code>stdout</code> back to the way it was before you mucked with it.
 <li>Close the log file.
 <p>Redirecting <code>stderr</code> works exactly the same way, using <code>sys.stderr</code> instead of <code>sys.stdout</code>.
@@ -4645,7 +4645,7 @@ entering function
 <ol>
 <li>This shorthand syntax of the <code>print</code> statement can be used to write to any open file, or file-like object. In this case, you can redirect a single <code>print</code> statement to <code>stderr</code> without affecting subsequent <code>print</code> statements.
 <p>Standard input, on the other hand, is a read-only file object, and it represents the data flowing into the program from some
-previous program. This will likely not make much sense to classic Mac OS users, or even Windows users unless you were ever fluent on the <acronym>MS-DOS</acronym> command line. The way it works is that you can construct a chain of commands in a single line, so that one program's output
+previous program. This will likely not make much sense to classic Mac OS users, or even to Windows users, unless you have ever been fluent on the <abbr>MS-DOS</abbr> command line. The way it works is that you can construct a chain of commands in a single line, so that one program's output
 becomes the input for the next program in the chain. The first program simply outputs to standard output (without doing any
 special redirecting itself, just doing normal <code>print</code> statements or whatever), and the next program reads from standard input, and the operating system takes care of connecting
 one program's output to the next program's input.
@@ -4693,7 +4693,7 @@ def openAnything(source):
 <ol>
 <li>This is the <code>openAnything</code> function from <code>toolbox.py</code>, which you previously examined in <a href="#kgp.openanything" title="10.1. Abstracting input sources">Section 10.1, &#8220;Abstracting input sources&#8221;</a>. All you've done is add three lines of code at the beginning of the function to check if the source is &#8220;<code>-</code>&#8221;; if so, you return <code>sys.stdin</code>. Really, that's it!  Remember, <code>stdin</code> is a file-like object with a <code>read</code> method, so the rest of the code (in <code>kgp.py</code>, where you call <code>openAnything</code>) doesn't change a bit.
 <h2 id="kgp.cache">10.3. Caching node lookups</h2>
-<p><code>kgp.py</code> employs several tricks which may or may not be useful to you in your <acronym>XML</acronym> processing. The first one takes advantage of the consistent structure of the input documents to build a cache of nodes.
+<p><code>kgp.py</code> employs several tricks which may or may not be useful to you in your <abbr>XML</abbr> processing. The first one takes advantage of the consistent structure of the input documents to build a cache of nodes.
 <p>A grammar file defines a series of <code>ref</code> elements. Each <code>ref</code> contains one or more <code>p</code> elements, which can contain a lot of different things, including <code>xref</code>s. Whenever you encounter an <code>xref</code>, you look for a corresponding <code>ref</code> element with the same <code>id</code> attribute, and choose one of the <code>ref</code> element's children and parse it. (You'll see how this random choice is made in the next section.)
 <p>This is how you build up the grammar: define <code>ref</code> elements for the smallest pieces, then define <code>ref</code> elements which "include" the first <code>ref</code> elements by using <code>xref</code>, and so forth. Then you parse the "largest" reference and follow each <code>xref</code>, and eventually output real text. The text you output depends on the (random) decisions you make each time you fill in an
 <code>xref</code>, so the output is different each time.
@@ -4708,14 +4708,14 @@ def openAnything(source):
 <li>Start by creating an empty dictionary, <var>self.refs</var>.
 <li>As you saw in <a href="#kgp.search" title="9.5. Searching for elements">Section 9.5, &#8220;Searching for elements&#8221;</a>, <code>getElementsByTagName</code> returns a list of all the elements of a particular name. You easily can get a list of all the <code>ref</code> elements, then simply loop through that list.
 <li>As you saw in <a href="#kgp.attributes" title="9.6. Accessing element attributes">Section 9.6, &#8220;Accessing element attributes&#8221;</a>, you can access individual attributes of an element by name, using standard dictionary syntax. So the keys of the <var>self.refs</var> dictionary will be the values of the <code>id</code> attribute of each <code>ref</code> element.
-<li>The values of the <var>self.refs</var> dictionary will be the <code>ref</code> elements themselves. As you saw in <a href="#kgp.parse" title="9.3. Parsing XML">Section 9.3, &#8220;Parsing XML&#8221;</a>, each element, each node, each comment, each piece of text in a parsed <acronym>XML</acronym> document is an object.
+<li>The values of the <var>self.refs</var> dictionary will be the <code>ref</code> elements themselves. As you saw in <a href="#kgp.parse" title="9.3. Parsing XML">Section 9.3, &#8220;Parsing XML&#8221;</a>, each element, each node, each comment, each piece of text in a parsed <abbr>XML</abbr> document is an object.
 <p>Once you build this cache, whenever you come across an <code>xref</code> and need to find the <code>ref</code> element with the same <code>id</code> attribute, you can simply look it up in <var>self.refs</var>.
 <div class=example><h3>Example 10.15. Using the <code>ref</code> element cache</h3><pre><code>
     def do_xref(self, node):
         id = node.attributes["id"].value
         self.parse(self.randomChildElement(self.refs[id]))</pre><p>You'll explore the <code>randomChildElement</code> function in the next section.
 <h2 id="kgp.child">10.4. Finding direct children of a node</h2>
-<p>Another useful techique when parsing <acronym>XML</acronym> documents is finding all the direct child elements of a particular element. For instance, in the grammar files, a <code>ref</code> element can have several <code>p</code> elements, each of which can contain many things, including other <code>p</code> elements. You want to find just the <code>p</code> elements that are children of the <code>ref</code>, not <code>p</code> elements that are children of other <code>p</code> elements.
+<p>Another useful technique when parsing <abbr>XML</abbr> documents is finding all the direct child elements of a particular element. For instance, in the grammar files, a <code>ref</code> element can have several <code>p</code> elements, each of which can contain many things, including other <code>p</code> elements. You want to find just the <code>p</code> elements that are children of the <code>ref</code>, not <code>p</code> elements that are children of other <code>p</code> elements.
 <p>You might think you could simply use <code>getElementsByTagName</code> for this, but you can't. <code>getElementsByTagName</code> searches recursively and returns a single list for all the elements it finds. Since <code>p</code> elements can contain other <code>p</code> elements, you can't use <code>getElementsByTagName</code>, because it would return nested <code>p</code> elements that you don't want. To find only direct child elements, you'll need to do it yourself.
 <div class=example><h3>Example 10.16. Finding direct child elements</h3><pre><code>
     def randomChildElement(self, node):
@@ -4731,8 +4731,8 @@ def openAnything(source):
             those nodes whose <var>nodeType</var> is <code>ELEMENT_NODE</code>.
 <li>Once you have a list of actual elements, choosing a random one is easy. Python comes with a module called <code>random</code> which includes several useful functions. The <code>random.choice</code> function takes a list of any number of items and returns a random item. For example, if the <code>ref</code> elements contains several <code>p</code> elements, then <var>choices</var> would be a list of <code>p</code> elements, and <var>chosen</var> would end up being assigned exactly one of them, selected at random.
 <h2 id="kgp.handler">10.5. Creating separate handlers by node type</h2>
-<p>The third useful <acronym>XML</acronym> processing tip involves separating your code into logical functions, based on node types and element names. Parsed <acronym>XML</acronym> documents are made up of various types of nodes, each represented by a Python object. The root level of the document itself is represented by a <code>Document</code> object. The <code>Document</code> then contains one or more <code>Element</code> objects (for actual <acronym>XML</acronym> tags), each of which may contain other <code>Element</code> objects, <code>Text</code> objects (for bits of text), or <code>Comment</code> objects (for embedded comments). Python makes it easy to write a dispatcher to separate the logic for each node type.
-<div class=example><h3>Example 10.17. Class names of parsed <acronym>XML</acronym> objects</h3><pre class=screen>
+<p>The third useful <abbr>XML</abbr> processing tip involves separating your code into logical functions, based on node types and element names. Parsed <abbr>XML</abbr> documents are made up of various types of nodes, each represented by a Python object. The root level of the document itself is represented by a <code>Document</code> object. The <code>Document</code> then contains one or more <code>Element</code> objects (for actual <abbr>XML</abbr> tags), each of which may contain other <code>Element</code> objects, <code>Text</code> objects (for bits of text), or <code>Comment</code> objects (for embedded comments). Python makes it easy to write a dispatcher to separate the logic for each node type.
+<div class=example><h3>Example 10.17. Class names of parsed <abbr>XML</abbr> objects</h3><pre class=screen>
 <samp class=prompt>>>> </samp><kbd>from xml.dom import minidom</kbd>
 <samp class=prompt>>>> </samp><kbd>xmldoc = minidom.parse('kant.xml')</kbd> <span>&#x2460;</span>
 <samp class=prompt>>>> </samp><kbd>xmldoc</kbd>
@@ -4743,11 +4743,11 @@ def openAnything(source):
 'Document'</pre><div class=calloutlist>
 <ol>
 <li>Assume for a moment that <code>kant.xml</code> is in the current directory.
-<li>As you saw in <a href="#kgp.packages" title="9.2. Packages">Section 9.2, &#8220;Packages&#8221;</a>, the object returned by parsing an <acronym>XML</acronym> document is a <code>Document</code> object, as defined in the <code>minidom.py</code> in the <code>xml.dom</code> package. As you saw in <a href="#fileinfo.create" title="5.4. Instantiating Classes">Section 5.4, &#8220;Instantiating Classes&#8221;</a>, <code>__class__</code> is built-in attribute of every Python object.
+<li>As you saw in <a href="#kgp.packages" title="9.2. Packages">Section 9.2, &#8220;Packages&#8221;</a>, the object returned by parsing an <abbr>XML</abbr> document is a <code>Document</code> object, as defined in the <code>minidom.py</code> in the <code>xml.dom</code> package. As you saw in <a href="#fileinfo.create" title="5.4. Instantiating Classes">Section 5.4, &#8220;Instantiating Classes&#8221;</a>, <code>__class__</code> is a built-in attribute of every Python object.
 <li>Furthermore, <code>__name__</code> is a built-in attribute of every Python class, and it is a string. This string is not mysterious; it's the same as the class name you type when you define a class
             yourself. (See <a href="#fileinfo.class" title="5.3. Defining Classes">Section 5.3, &#8220;Defining Classes&#8221;</a>.)
-<p>Fine, so now you can get the class name of any particular <acronym>XML</acronym> node (since each <acronym>XML</acronym> node is represented as a Python object). How can you use this to your advantage to separate the logic of parsing each node type?  The answer is <code>getattr</code>, which you first saw in <a href="#apihelper.getattr" title="4.4. Getting Object References With getattr">Section 4.4, &#8220;Getting Object References With getattr&#8221;</a>.
-<div class=example><h3>Example 10.18. <code>parse</code>, a generic <acronym>XML</acronym> node dispatcher</h3><pre><code>
+<p>Fine, so now you can get the class name of any particular <abbr>XML</abbr> node (since each <abbr>XML</abbr> node is represented as a Python object). How can you use this to your advantage to separate the logic of parsing each node type?  The answer is <code>getattr</code>, which you first saw in <a href="#apihelper.getattr" title="4.4. Getting Object References With getattr">Section 4.4, &#8220;Getting Object References With getattr&#8221;</a>.
+<div class=example><h3>Example 10.18. <code>parse</code>, a generic <abbr>XML</abbr> node dispatcher</h3><pre><code>
     def parse(self, node):          
         parseMethod = getattr(self, "parse_%s" % node.__class__.__name__) <span>&#x2460;</span> <span>&#x2461;</span>
         parseMethod(node) <span>&#x2462;</span></pre><div class=calloutlist>
@@ -4775,7 +4775,7 @@ def openAnything(source):
         handlerMethod = getattr(self, "do_%s" % node.tagName)
         handlerMethod(node)</pre><div class=calloutlist>
 <ol>
-<li><code>parse_Document</code> is only ever called once, since there is only one <code>Document</code> node in an <acronym>XML</acronym> document, and only one <code>Document</code> object in the parsed <acronym>XML</acronym> representation. It simply turns around and parses the root element of the grammar file.
+<li><code>parse_Document</code> is only ever called once, since there is only one <code>Document</code> node in an <abbr>XML</abbr> document, and only one <code>Document</code> object in the parsed <abbr>XML</abbr> representation. It simply turns around and parses the root element of the grammar file.
 <li><code>parse_Text</code> is called on nodes that represent bits of text. The function itself does some special processing to handle automatic capitalization
             of the first word of a sentence, but otherwise simply appends the represented text to a list.
 <li><code>parse_Comment</code> is just a <code>pass</code>, since you don't care about embedded comments in the grammar files. Note, however, that you still need to define the function
@@ -4789,7 +4789,7 @@ you could break up your code into separate modules, and use dynamic importing to
 you needed. Dynamic importing will be discussed in <a href="#regression" title="Chapter 16. Functional Programming">Chapter 16, <i>Functional Programming</i></a>.
 <h2 id="kgp.commandline">10.6. Handling command-line arguments</h2>
 <p>Python fully supports creating programs that can be run on the command line, complete with command-line arguments and either short-
-   or long-style flags to specify various options. None of this is <acronym>XML</acronym>-specific, but this script makes good use of command-line processing, so it seemed like a good time to mention it.
+   or long-style flags to specify various options. None of this is <abbr>XML</abbr>-specific, but this script makes good use of command-line processing, so it seemed like a good time to mention it.
 <p>It's difficult to talk about command-line processing without understanding how command-line arguments are exposed to your
 Python program, so let's write a simple program to see them.
 <div class=example><h3>Example 10.20. Introducing <var>sys.argv</var></h3>
@@ -4846,7 +4846,7 @@ if __name__ == "__main__":
             command-line flags that are equivalent to the single-character versions. This is quite confusing at first glance, and is
             explained in more detail below.
 <li>If anything goes wrong trying to parse these command-line flags, <code>getopt</code> will raise an exception, which you catch. You told <code>getopt</code> all the flags you understand, so this probably means that the end user passed some command-line flag that you don't understand.
-<li>As is standard practice in the <acronym>UNIX</acronym> world, when the script is passed flags it doesn't understand, you print out a summary of proper usage and exit gracefully.
+<li>As is standard practice in the <abbr>UNIX</abbr> world, when the script is passed flags it doesn't understand, you print out a summary of proper usage and exit gracefully.
              Note that I haven't shown the <code>usage</code> function here. You would still need to code that somewhere and have it print out the appropriate summary; it's not automatic.
 <p>So what are all those parameters you pass to the <code>getopt</code> function?  Well, the first one is simply the raw list of command-line flags and arguments (not including the first element,
 the script name, which you already chopped off before calling the <code>main</code> function). The second is the list of short command-line flags that the script accepts.
@@ -4932,12 +4932,12 @@ def main(argv):
     for opt, arg in opts:               
 ...</pre><p>You create a new instance of the <code>KantGenerator</code> class, and pass it the grammar file and source that may or may not have been specified on the command line.
 <pre><code>
-    k = KantGenerator(grammar, source)</pre><p>The <code>KantGenerator</code> instance automatically loads the grammar, which is an <acronym>XML</acronym> file. You use your custom <code>openAnything</code> function to open the file (which <a href="#kgp.openanything" title="10.1. Abstracting input sources">could be stored in a local file or a remote web server</a>), then use the built-in <code>minidom</code> parsing functions to <a href="#kgp.parse" title="9.3. Parsing XML">parse the <acronym>XML</acronym> into a tree of Python objects</a>.
+    k = KantGenerator(grammar, source)</pre><p>The <code>KantGenerator</code> instance automatically loads the grammar, which is an <abbr>XML</abbr> file. You use your custom <code>openAnything</code> function to open the file (which <a href="#kgp.openanything" title="10.1. Abstracting input sources">could be stored in a local file or a remote web server</a>), then use the built-in <code>minidom</code> parsing functions to <a href="#kgp.parse" title="9.3. Parsing XML">parse the <abbr>XML</abbr> into a tree of Python objects</a>.
 <pre><code>
     def _load(self, source):
         sock = toolbox.openAnything(source)
         xmldoc = minidom.parse(sock).documentElement
-        sock.close()</pre><p>Oh, and along the way, you take advantage of your knowledge of the structure of the <acronym>XML</acronym> document to <a href="#kgp.cache" title="10.3. Caching node lookups">set up a little cache of references</a>, which are just elements in the <acronym>XML</acronym> document.
+        sock.close()</pre><p>Oh, and along the way, you take advantage of your knowledge of the structure of the <abbr>XML</abbr> document to <a href="#kgp.cache" title="10.3. Caching node lookups">set up a little cache of references</a>, which are just elements in the <abbr>XML</abbr> document.
 <pre><code>
     def loadGrammar(self, grammar):       
         for ref in self.grammar.getElementsByTagName("ref"):
@@ -4950,7 +4950,7 @@ the "top-level" reference (that isn't referenced by anything else) and use that
             xrefs[xref.attributes["id"].value] = 1
         xrefs = xrefs.keys()
         standaloneXrefs = [e for e in self.refs.keys() if e not in xrefs]
-        return '&lt;xref id="%s"/>' % random.choice(standaloneXrefs)</pre><p>Now you rip through the source material. The source material is also <acronym>XML</acronym>, and you parse it one node at a time. To keep the code separated and more maintainable, you use <a href="#kgp.handler" title="10.5. Creating separate handlers by node type">separate handlers for each node type</a>.
+        return '&lt;xref id="%s"/>' % random.choice(standaloneXrefs)</pre><p>Now you rip through the source material. The source material is also <abbr>XML</abbr>, and you parse it one node at a time. To keep the code separated and more maintainable, you use <a href="#kgp.handler" title="10.5. Creating separate handlers by node type">separate handlers for each node type</a>.
 <pre><code>
     def parse_Element(self, node): 
         handlerMethod = getattr(self, "do_%s" % node.tagName)
@@ -4977,7 +4977,7 @@ def main(argv):
 ...
     k = KantGenerator(grammar, source)
     print k.output()</pre><h2 id="kgp.summary">10.8. Summary</h2>
-<p>Python comes with powerful libraries for parsing and manipulating <acronym>XML</acronym> documents. The <code>minidom</code> takes an <acronym>XML</acronym> file and parses it into Python objects, providing for random access to arbitrary elements. Furthermore, this chapter shows how Python can be used to create a "real" standalone command-line script, complete with command-line flags, command-line arguments,
+<p>Python comes with powerful libraries for parsing and manipulating <abbr>XML</abbr> documents. The <code>minidom</code> takes an <abbr>XML</abbr> file and parses it into Python objects, providing for random access to arbitrary elements. Furthermore, this chapter shows how Python can be used to create a "real" standalone command-line script, complete with command-line flags, command-line arguments,
    error handling, even the ability to take input from the piped result of a previous program.
 <p>Before moving on to the next chapter, you should be comfortable doing all of these things:
 <div class=itemizedlist>
@@ -5226,7 +5226,7 @@ header: Connection: close
 <li>Now that the debugging flag is set, information on the the HTTP request and response is printed out in real time. The first
          thing it tells you is that you're connecting to the server <code>diveintomark.org</code> on port 80, which is the standard port for HTTP.
 <li>When you request the Atom feed, <code>urllib</code> sends three lines to the server. The first line specifies the HTTP verb you're using, and the path of the resource (minus
-         the domain name). All the requests in this chapter will use <code>GET</code>, but in the next chapter on <acronym>SOAP</acronym>, you'll see that it uses <code>POST</code> for everything. The basic syntax is the same, regardless of the verb.
+         the domain name). All the requests in this chapter will use <code>GET</code>, but in the next chapter on <abbr>SOAP</abbr>, you'll see that it uses <code>POST</code> for everything. The basic syntax is the same, regardless of the verb.
 <li>The second line is the <code>Host</code> header, which specifies the domain name of the service you're accessing. This is important, because a single HTTP server
          can host multiple separate domains. My server currently hosts 12 domains; other servers can host hundreds or even thousands.
 <li>The third line is the <code>User-Agent</code> header. What you see here is the generic <code>User-Agent</code> that the <code>urllib</code> library adds by default. In the next section, you'll see how to customize this to be more specific.
@@ -5263,7 +5263,7 @@ header: Content-Length: 26848
 header: Connection: close
 </pre><div class=calloutlist>
 <ol>
-<li>If you still have your Python <acronym>IDE</acronym> open from the previous section's example, you can skip this, but this turns on <a href="#oa.debug" title="11.4. Debugging HTTP web services">HTTP debugging</a> so you can see what you're actually sending over the wire, and what gets sent back.
+<li>If you still have your Python <abbr>IDE</abbr> open from the previous section's example, you can skip this, but this turns on <a href="#oa.debug" title="11.4. Debugging HTTP web services">HTTP debugging</a> so you can see what you're actually sending over the wire, and what gets sent back.
 <li>Fetching an HTTP resource with <code>urllib2</code> is a three-step process, for good reasons that will become clear shortly. The first step is to create a <code>Request</code> object, which takes the URL of the resource you'll eventually get around to retrieving. Note that this step doesn't actually
             retrieve anything yet.
 <li>The second step is to build a URL opener. This can take any number of handlers, which control how responses are handled.
@@ -5387,7 +5387,7 @@ class DefaultErrorHandler(urllib2.HTTPDefaultErrorHandler):    <span>&#x2460;</s
 <li>Now you can quietly open the resource, and what you get back is an object that, along with the usual headers (use <var>seconddatastream.headers.dict</var> to acess them), also contains the HTTP status code. In this case, as you expected, the status is <code>304</code>, meaning this data hasn't changed since the last time you asked for it.
 <li>Note that when the server sends back a <code>304</code> status code, it doesn't re-send the data. That's the whole point: to save bandwidth by not re-downloading data that hasn't
             changed. So if you actually want that data, you'll need to cache it locally the first time you get it.
-<p>Handling <code>ETag</code> works much the same way, but instead of checking for <code>Last-Modified</code> and sending <code>If-Modified-Since</code>, you check for <code>ETag</code> and send <code>If-None-Match</code>. Let's start with a fresh <acronym>IDE</acronym> session.
+<p>Handling <code>ETag</code> works much the same way, but instead of checking for <code>Last-Modified</code> and sending <code>If-Modified-Since</code>, you check for <code>ETag</code> and send <code>If-None-Match</code>. Let's start with a fresh <abbr>IDE</abbr> session.
 <div class=example><h3 id="oa.etags.example">Example 11.9. Supporting <code>ETag</code>/<code>If-None-Match</code></h3><pre class=screen>
 <samp class=prompt>>>> </samp><kbd>import urllib2, openanything</kbd>
 <samp class=prompt>>>> </samp><kbd>request = urllib2.Request('http://diveintomark.org/xml/atom.xml')</kbd>
@@ -5812,7 +5812,7 @@ numerals. You saw the mechanics of constructing and validating Roman numerals in
 <div class=orderedlist>
 <ol>
 <li>There is only one correct way to represent a particular number as Roman numerals.
-<li>The converse is also true: if a string of characters is a valid Roman numeral, it represents only one number (<i class=foreignphrase><acronym>i.e.</acronym></i> it can only be read one way).
+<li>The converse is also true: if a string of characters is a valid Roman numeral, it represents only one number (<i class=foreignphrase><abbr>i.e.</abbr></i> it can only be read one way).
 
 <li>There is a limited range of numbers that can be expressed as Roman numerals, specifically <code>1</code> through <code>3999</code>. (The Romans did have several ways of expressing larger numbers, for instance by having a bar over a numeral to represent
       that its normal value should be multiplied by <code>1000</code>, but you're not going to deal with that. For the purposes of this chapter, let's stipulate that Roman numerals go from <code>1</code> to <code>3999</code>.)
@@ -5840,7 +5840,7 @@ numerals. You saw the mechanics of constructing and validating Roman numerals in
 
 <li><code>to_roman()</code> should always return a Roman numeral using uppercase letters.
 
-<li><code>from_roman()</code> should only accept uppercase Roman numerals (<i class=foreignphrase><acronym>i.e.</acronym></i> it should fail when given lowercase input).
+<li><code>from_roman()</code> should only accept uppercase Roman numerals (<i class=foreignphrase><abbr>i.e.</abbr></i> it should fail when given lowercase input).
 
 </ol>
 <div class=itemizedlist>
@@ -5942,7 +5942,7 @@ class SanityCheck(unittest.TestCase):
 <ol start="7">
 <li><code>to_roman()</code> should always return a Roman numeral using uppercase letters.
 
-<li><code>from_roman()</code> should only accept uppercase Roman numerals (<i class=foreignphrase><acronym>i.e.</acronym></i> it should fail when given lowercase input).
+<li><code>from_roman()</code> should only accept uppercase Roman numerals (<i class=foreignphrase><abbr>i.e.</abbr></i> it should fail when given lowercase input).
 
 </ol>
 <p>In fact, they are somewhat arbitrary. You could, for instance, have stipulated that <code>from_roman()</code> accept lowercase and mixed case input. But they are not completely arbitrary; if <code>to_roman()</code> is always returning uppercase output, then <code>from_roman()</code> must at least accept uppercase input, or the &#8220;sanity check&#8221; (requirement #6) would fail. The fact that it <em>only</em> accepts uppercase input is arbitrary, but as any systems integrator will tell you, case always matters, so it's worth specifying
@@ -6012,10 +6012,10 @@ def from_roman(s):
             have inherited each individual exception from the <code>Exception</code> class directly.
 <li>The <code>OutOfRangeError</code> and <code>NotIntegerError</code> exceptions will eventually be used by <code>to_roman()</code> to flag various forms of invalid input, as specified in <a href="#roman.tobadinput.example" title="Example 13.3. Testing bad input to to_roman"><code>ToRomanBadInput</code></a>.
 <li>The <code>InvalidRomanNumeralError</code> exception will eventually be used by <code>from_roman()</code> to flag invalid input, as specified in <a href="#roman.frombadinput.example" title="Example 13.4. Testing bad input to from_roman"><code>FromRomanBadInput</code></a>.
-<li>At this stage, you want to define the <acronym>API</acronym> of each of your functions, but you don't want to code them yet, so you stub them out using the Python reserved word <a href="#fileinfo.class.simplest" title="Example 5.3. The Simplest Python Class"><code>pass</code></a>.
+<li>At this stage, you want to define the <abbr>API</abbr> of each of your functions, but you don't want to code them yet, so you stub them out using the Python reserved word <a href="#fileinfo.class.simplest" title="Example 5.3. The Simplest Python Class"><code>pass</code></a>.
 <p>Now for the big moment (drum roll please): you're finally going to run the unit test against this stubby little module. At
 this point, every test case should fail. In fact, if any test case passes in stage 1, you should go back to <code>romantest.py</code> and re-evaluate why you coded a test so useless that it passes with do-nothing functions.
-<li>At this stage, you want to define the <acronym>API</acronym> of each of your functions, but you don't want to code them yet, so you stub them out using the Python reserved word <a href="#fileinfo.class.simplest" title="Example 5.3. The Simplest Python Class"><code>pass</code></a>.
+<li>At this stage, you want to define the <abbr>API</abbr> of each of your functions, but you don't want to code them yet, so you stub them out using the Python reserved word <a href="#fileinfo.class.simplest" title="Example 5.3. The Simplest Python Class"><code>pass</code></a>.
 <p>Run <code>romantest1.py</code> with the <code>-v</code> command-line option, which will give more verbose output so you can see exactly what's going on as each test case runs. 
 With any luck, your output should look like this:
 <div class=example><h3 id="roman.stage1.output">Example 14.2. Output of <code>romantest1.py</code> against <code>roman1.py</code></h3><pre class=screen><samp>from_roman should only accept uppercase input ... ERROR
diff --git a/dip3.css b/dip3.css
index 0abc379..1ddd8cc 100644
--- a/dip3.css
+++ b/dip3.css
@@ -27,15 +27,19 @@ a:visited{color:darkorchid}
 .skip a:active,.skip a:focus{position:static;width:auto;height:auto}
 
 /* code blocks */
-pre{white-space:pre-wrap;padding-left:2.154em;line-height:2.154;border-left:1px dotted}
+pre{white-space:pre-wrap;padding-left:2.154em;line-height:2.154;border-left:1px solid gainsboro}
 .widgets{float:left}
 .widgets,.widgets a,.download{font-size:small;line-height:2.154}
-.block,ol{clear:left}
+.block,ol,p,blockquote{clear:left}
 pre a,.widgets a{padding:0.4375em 0;border:0}
 .widgets a{text-decoration:underline}
 pre a:hover{border:0}
 kbd{font-weight:bold}
 .prompt{color:#667}
+ins,del,mark{text-decoration:none;font-style:normal;display:inline-block;width:100%;line-height:2.154}
+del{background:salmon}
+ins{background:palegreen}
+mark{background:#ffff80}
 
 /* tables */
 table{width:100%;border-collapse:collapse}
@@ -45,7 +49,7 @@ td{vertical-align:top}
 th:first-child{width:10%;text-align:center}
 .simple th{font-family:inherit !important}
 .hover{background:#eee;color:inherit;cursor:default}
-td pre{margin:0;padding:0;border:0}
+td pre{margin:0;padding:0;border:0;background:inherit}
 
 /* headers */
 h1,h2,h3,p,ul,ol{margin:1.75em 0;font-size:medium}
@@ -57,3 +61,6 @@ h1{counter-reset:h2}
 h2:before{counter-increment:h2;content:counter(h1) "." counter(h2) ". "}
 h2{counter-reset:h3}
 h3:before{counter-increment:h3;content:counter(h1) "." counter(h2) "." counter(h3) ". "}
+
+/* HTML 5 support */
+article,aside,dialog,footer,header,section{display:block}
\ No newline at end of file
diff --git a/index.html b/index.html
index ff4e168..505a0ad 100644
--- a/index.html
+++ b/index.html
@@ -3,6 +3,7 @@
 <head>
 <meta charset=utf-8>
 <title>Dive Into Python 3</title>
+<!--[if IE]><script src="html5.js"></script><![endif]-->
 <link rel=stylesheet type=text/css href=dip3.css>
 <link rel="shortcut icon" href=data:image/ico,>
 <link rel=alternate type=application/atom+xml href=http://hg.diveintopython3.org/atom-log>
@@ -10,32 +11,33 @@
 .first{clear:both;margin-top:0;padding-top:1.75em}
 li:last-child{list-style:none;margin:0 0 0 -1.7em}
 li:last-child:before{content:"A. \00a0 \00a0"}
+li.todo{background:white;color:gainsboro}
 </style>
 </head>
 <form action=http://www.google.com/cse id=search><div><input type=hidden name=cx value=014021643941856155761:l5eihuescdw><input type=hidden name=ie value=UTF-8><input name=q size=31>&nbsp;<input type=submit name=sa value=Search></div></form>
 <p class=first><cite>Dive Into Python 3</cite> will cover Python 3 and its differences from Python 2. Compared to the original <cite><a href=http://diveintopython.org/>Dive Into Python</a></cite>, it will be about 50% revised and 50% new material. I will publish drafts online as I go. The final version will be published on paper by Apress. The book will remain online under the <a rel=license href=http://creativecommons.org/licenses/by-sa/3.0/>CC-BY-SA-3.0</a> license.
 <p>You can see the <a href=table-of-contents.html>full table of contents</a> (<strong>not finalized</strong>), or read what I&#8217;ve written so far:</p>
 <ol start=0>
-<li>
+<li class=todo>Installing Python
 <li><a href=your-first-python-program.html>Your first Python program</a>
 <li><a href=native-datatypes.html>Native datatypes</a>
-<li>
+<li class=todo>Strings
 <li><a href=regular-expressions.html>Regular expressions</a>
-<li>
-<li>
+<li class=todo>The power of introspection
+<li class=todo>Objects and object-orientation
 <li><a href=unit-testing.html>Unit testing</a>
-<li>
-<li>
-<li>
-<li>
-<li>
-<li>
-<li>
-<li>
-<li>
-<li>
-<li>
-<li>
+<li class=todo>Test-first programming
+<li class=todo>Refactoring your code
+<li class=todo>Files
+<li class=todo>HTML processing
+<li class=todo>XML processing
+<li class=todo>Web services
+<li class=todo>Dynamic functions
+<li class=todo>Metaclasses
+<li class=todo>Performance tuning
+<li class=todo>Packaging Python libraries
+<li class=todo>Creating graphics with the Python Imaging Library
+<li class=todo>Where to go from here
 <li><a href=case-study-porting-chardet-to-python-3.html>Case study: porting <code>chardet</code> to Python 3</a>
 <li><a href=porting-code-to-python-3-with-2to3.html>Porting code to Python 3 with <code>2to3</code></a>
 </ol>
diff --git a/native-datatypes.html b/native-datatypes.html
index 96b52e6..884e6ac 100644
--- a/native-datatypes.html
+++ b/native-datatypes.html
@@ -3,6 +3,7 @@
 <head>
 <meta charset=utf-8>
 <title>Native datatypes - Dive into Python 3</title>
+<!--[if IE]><script src="html5.js"></script><![endif]-->
 <link rel=stylesheet type=text/css href=dip3.css>
 <link rel="shortcut icon" href=data:image/ico,>
 <link rel=alternate type=application/atom+xml href=http://hg.diveintopython3.org/atom-log>
diff --git a/porting-code-to-python-3-with-2to3.html b/porting-code-to-python-3-with-2to3.html
index cbd8d49..15e7f17 100644
--- a/porting-code-to-python-3-with-2to3.html
+++ b/porting-code-to-python-3-with-2to3.html
@@ -3,6 +3,7 @@
 <head>
 <meta charset=utf-8>
 <title>Porting code to Python 3 with 2to3 - Dive into Python 3</title>
+<!--[if IE]><script src="html5.js"></script><![endif]-->
 <link rel=stylesheet type=text/css href=dip3.css>
 <link rel="shortcut icon" href=data:image/ico,>
 <link rel=alternate type=application/atom+xml href=http://hg.diveintopython3.org/atom-log>
diff --git a/publish b/publish
index 3c929c6..b8d585f 100644
--- a/publish
+++ b/publish
@@ -14,8 +14,6 @@ sed -i -e "s|//}.; /\* google\..*|});|g" build/dip3.js
 revision=`hg log|grep changeset|cut -d":" -f3|head -1`
 java -jar yuicompressor-2.4.2.jar build/dip3.js > build/dip3.$revision.min.js
 java -jar yuicompressor-2.4.2.jar build/dip3.css > build/dip3.$revision.min.css
-#rm build/dip3.js
-#rm build/dip3.css
 sed -i -e "s|dip3\.js|http://wearehugh.com/dip3/dip3.${revision}.min.js|g" build/*.html
 sed -i -e "s|dip3\.css|http://wearehugh.com/dip3/dip3.${revision}.min.css|g" build/*.html
 
@@ -23,5 +21,5 @@ sed -i -e "s|dip3\.css|http://wearehugh.com/dip3/dip3.${revision}.min.css|g" bui
 chmod 644 build/*.html build/*.css build/*.js build/*.py build/*.txt build/.htaccess
 
 # and push to production
-rsync -essh -avzP --delete --delete-after build/*.min.css build/*.min.js diveintomark.org:~/web/wearehugh.com/dip3/
+rsync -essh -avzP --delete --delete-after build/*.min.css build/*.min.js build/html5.js diveintomark.org:~/web/wearehugh.com/dip3/
 rsync -essh -avzP build/*.html build/*.py build/*.txt build/.htaccess diveintomark.org:~/web/diveintopython3.org/
diff --git a/regular-expressions.html b/regular-expressions.html
index 776d247..b55fe31 100644
--- a/regular-expressions.html
+++ b/regular-expressions.html
@@ -3,6 +3,7 @@
 <head>
 <meta charset=utf-8>
 <title>Regular expressions - Dive into Python 3</title>
+<!--[if IE]><script src="html5.js"></script><![endif]-->
 <link rel=stylesheet type=text/css href=dip3.css>
 <link rel="shortcut icon" href=data:image/ico,>
 <link rel=alternate type=application/atom+xml href=http://hg.diveintopython3.org/atom-log>
diff --git a/table-of-contents.html b/table-of-contents.html
index c8d668c..87bbccf 100644
--- a/table-of-contents.html
+++ b/table-of-contents.html
@@ -3,6 +3,7 @@
 <head>
 <meta charset=utf-8>
 <title>Table of contents - Dive Into Python 3</title>
+<!--[if IE]><script src="html5.js"></script><![endif]-->
 <link rel=stylesheet type=text/css href=dip3.css>
 <link rel="shortcut icon" href=data:image/ico,>
 <link rel=alternate type=application/atom+xml href=http://hg.diveintopython3.org/atom-log>
diff --git a/unit-testing.html b/unit-testing.html
index 758154b..94ba851 100644
--- a/unit-testing.html
+++ b/unit-testing.html
@@ -3,6 +3,7 @@
 <head>
 <meta charset=utf-8>
 <title>Unit testing - Dive into Python 3</title>
+<!--[if IE]><script src="html5.js"></script><![endif]-->
 <link rel=stylesheet type=text/css href=dip3.css>
 <link rel="shortcut icon" href=data:image/ico,>
 <link rel=alternate type=application/atom+xml href=http://hg.diveintopython3.org/atom-log>
@@ -134,7 +135,7 @@ if __name__ == "__main__":
 <li>To write a test case, first subclass the <code>TestCase</code> class of the <code>unittest</code> module. This class provides many useful methods which you can use in your test case to test specific conditions.
 <li>This is a list of integer/numeral pairs that I verified manually. It includes the lowest ten numbers, the highest number, every number that translates to a single-character Roman numeral, and a random sampling of other valid numbers. The point of a unit test is not to test every possible input, but to test a representative sample.
 <li>Every individual test is its own method, which must take no parameters and return no value. If the method exits normally without raising an exception, the test is considered passed; if the method raises an exception, the test is considered failed.
-<li>Here you call the actual <code>to_roman()</code> function. (Well, the function hasn't be written yet, but once it is, this is the line that will call it.)  Notice that you have now defined the <acronym>API</acronym> for the <code>to_roman()</code> function: it must take an integer (the number to convert) and return a string (the Roman numeral representation). If the <acronym>API</acronym> is different than that, this test is considered failed. Also notice that you are not trapping any exceptions when you call <code>to_roman()</code>. This is intentional. <code>to_roman()</code> shouldn't raise an exception when you call it with valid input, and these input values are all valid. If <code>to_roman()</code> raises an exception, this test is considered failed.
+<li>Here you call the actual <code>to_roman()</code> function. (Well, the function hasn't been written yet, but once it is, this is the line that will call it.)  Notice that you have now defined the <abbr>API</abbr> for the <code>to_roman()</code> function: it must take an integer (the number to convert) and return a string (the Roman numeral representation). If the <abbr>API</abbr> is different than that, this test is considered failed. Also notice that you are not trapping any exceptions when you call <code>to_roman()</code>. This is intentional. <code>to_roman()</code> shouldn't raise an exception when you call it with valid input, and these input values are all valid. If <code>to_roman()</code> raises an exception, this test is considered failed.
 <li>Assuming the <code>to_roman()</code> function was defined correctly, called correctly, completed successfully, and returned a value, the last step is to check whether it returned the <em>right</em> value. This is a common question, and the <code>TestCase</code> class provides a method, <code>assertEqual</code>, to check whether two values are equal. If the result returned from <code>to_roman()</code> (<var>result</var>) does not match the known value you were expecting (<var>numeral</var>), <code>assertEqual</code> will raise an exception and the test will fail. If the two values are equal, <code>assertEqual</code> will do nothing. If every value returned from <code>to_roman()</code> matches the known value you expect, <code>assertEqual</code> never raises an exception, so <code>testToRomanKnownValues</code> eventually exits normally, which means <code>to_roman()</code> has passed this test.
 </ol>
 <p>Once you have a test case, you can start coding the <code>to_roman()</code> function. First, you should stub it out as an empty function and make sure the tests fail. If the tests succeed before you've written any code, you're doing it wrong &mdash; your tests aren't testing your code at all! Write a test that fails, then code until it passes.
@@ -144,7 +145,7 @@ function to_roman(n):
     """convert integer to Roman numeral"""
 <a>    pass                                   <span>&#x2460;</span></a></code></pre>
 <ol>
-<li>At this stage, you want to define the <acronym>API</acronym> of the <code>to_roman()</code> function, but you don't want to code it yet. (Your test needs to fail first.) To stub it out, use the Python reserved word <code>pass</code> [FIXME ref], which does precisely nothing.</a>.
+<li>At this stage, you want to define the <abbr>API</abbr> of the <code>to_roman()</code> function, but you don't want to code it yet. (Your test needs to fail first.) To stub it out, use the Python reserved word <code>pass</code> [FIXME ref], which does precisely nothing.
 </ol>
 <p>Execute <code>romantest1.py</code> on the command line to run the test. If you call it with the <code>-v</code> command-line option, it will give more verbose output so you can see exactly what's going on as each test case runs. With any luck, your output should look like this:
 <pre class=screen>
@@ -289,7 +290,7 @@ FAILED (errors=1)</samp></pre>
 <p>Now run the test suite again.
 <pre class=screen>
 <samp class=prompt>you@localhost:~$ </samp><kbd>python3 romantest2.py -v</kbd>
-to_roman should give known result with known input ... ok
+<samp>to_roman should give known result with known input ... ok
 <a>to_roman should fail with large input ... FAIL                          <span>&#x2460;</span></a>
 
 ======================================================================
@@ -360,7 +361,7 @@ For instance, the <code>testFromRomanCase</code> method (&#8220;<code>from_roman
 <li>If you take a number, convert it to Roman numerals, then convert that back to a number, you should end up with the number
       you started with. So <code>from_roman(to_roman(n)) == n</code> for all <var>n</var> in <code>1..3999</code>.
 <li><code>to_roman</code> should always return a Roman numeral using uppercase letters.
-<li><code>from_roman</code> should only accept uppercase Roman numerals (<i class=foreignphrase><acronym>i.e.</acronym></i> it should fail when given lowercase input).
+<li><code>from_roman</code> should only accept uppercase Roman numerals (<i class=foreignphrase><abbr>i.e.</abbr></i> it should fail when given lowercase input).
 </ol>
 -->
 <p class=c>&copy; 2001&ndash;4, 2009 <span>&#x2133;</span>ark Pilgrim, <a href=http://creativecommons.org/licenses/by-sa/3.0/ rel=license>CC-BY-SA-3.0</a>
diff --git a/your-first-python-program.html b/your-first-python-program.html
index f2ef8ac..9513797 100644
--- a/your-first-python-program.html
+++ b/your-first-python-program.html
@@ -3,6 +3,7 @@
 <head>
 <meta charset=utf-8>
 <title>Your first Python program - Dive into Python 3</title>
+<!--[if IE]><script src="html5.js"></script><![endif]-->
 <link rel=stylesheet type=text/css href=dip3.css>
 <link rel="shortcut icon" href=data:image/ico,>
 <link rel=alternate type=application/atom+xml href=http://hg.diveintopython3.org/atom-log>
@@ -42,6 +43,7 @@ body{counter-reset:h1 1}
 <p class=fancy>Books about programming usually start with a bunch of boring chapters about fundamentals and eventually work up to building something useful. Let's skip all that. Here is a complete, working Python program. It probably makes absolutely no sense to you. Don't worry about that, because you're going to dissect it line by line. But read through it first and see what, if anything, you can make of it.
 <p id=noscript>[The code examples will be easier to follow if you enable Javascript, but whatever.]
 <p class=download>[<a href=humansize.py>download <code>humansize.py</code></a>]</p>
+<p class=skip><a href=#skip-humansize-py>skip over this code listing</a>
 <pre><code>SUFFIXES = {1000: ['KB', 'MB', 'GB', 'TB', 'PB', 'EB', 'ZB', 'YB'],
             1024: ['KiB', 'MiB', 'GiB', 'TiB', 'PiB', 'EiB', 'ZiB', 'YiB']}
 
@@ -70,7 +72,8 @@ def approximate_size(size, a_kilobyte_is_1024_bytes=True):
 if __name__ == "__main__":
     print(approximate_size(1000000000000, False))
     print(approximate_size(1000000000000))</code></pre>
-<p>Now let's run this program on the command line. On Windows, it will look something like this:
+<p id=skip-humansize-py>Now let's run this program on the command line. On Windows, it will look something like this:
+<p class=skip><a href=#skip-humansize-screen>skip over this command output listing</a>
 <pre class=screen>
 <samp class=prompt>c:\home\diveintopython3> </samp><kbd>c:\python30\python.exe humansize.py</kbd>
 <samp>1.0 TB
@@ -80,7 +83,7 @@ if __name__ == "__main__":
 <samp class=prompt>you@localhost:~$ </samp><kbd>python3 humansize.py</kbd>
 <samp>1.0 TB
 931.3 GiB</samp></pre>
-<!-- FIXME: this would be a good place to explain what the program, you know, actually does -->
+<p id=skip-humansize-screen>FIXME: this would be a good place to explain what the program, you know, actually does.
 <h2 id=declaringfunctions>Declaring functions</h2>
 <p>Python has functions like most other languages, but it does not have separate header files like <abbr>C++</abbr> or <code>interface</code>/<code>implementation</code> sections like Pascal. When you need a function, just declare it, like this:
 <pre><code>def approximate_size(size, a_kilobyte_is_1024_bytes=True):</code></pre>
@@ -120,6 +123,7 @@ if __name__ == "__main__":
 <p>I won't bore you with a long finger-wagging speech about the importance of documenting your code. Just know that code is written once but read many times, and the most important audience for your code is yourself, six months after writing it (i.e. after you've forgotten everything but need to fix something). Python makes it easy to write readable code, so take advantage of it. You'll thank me in six months.
 <h3 id=docstrings>Documentation strings</h3>
 <p>You can document a Python function by giving it a documentation string (<code>docstring</code> for short). In this program, the <code>approximate_size</code> function has a <code>docstring</code>:
+<p class=skip><a href=#skip-approximate-size>skip over this code listing</a>
 <pre><code>def approximate_size(size, a_kilobyte_is_1024_bytes=True):
     """Convert a file size to human-readable form.
 
@@ -131,7 +135,7 @@ if __name__ == "__main__":
     Returns: string
 
     """</code></pre>
-<p>Triple quotes signify a multi-line string. Everything between the start and end quotes is part of a single string, including carriage returns, leading white space, and other quote characters. You can use them anywhere, but you'll see them most often used when defining a <code>docstring</code>.
+<p id=skip-approximate-size>Triple quotes signify a multi-line string. Everything between the start and end quotes is part of a single string, including carriage returns, leading white space, and other quote characters. You can use them anywhere, but you'll see them most often used when defining a <code>docstring</code>.
 <blockquote class="note compare perl5">
 <p><span>&#x261E;</span>Triple quotes are also an easy way to define a string with both single and double quotes, like <code>qq/.../</code> in Perl 5.
 </blockquote>
@@ -146,6 +150,7 @@ if __name__ == "__main__":
 <h2 id=everythingisanobject>Everything is an object</h2>
 <p>In case you missed it, I just said that Python functions have attributes, and that those attributes are available at runtime. A function, like everything else in Python, is an object.
 <p>Run the interactive Python shell and follow along:
+<p class=skip><a href=#skip-everything-is-an-object-screen>skip over this interpreter listing</a>
 <pre class=screen>
 <a><samp class=prompt>>>> </samp><kbd>import humansize</kbd>                               <span>&#x2460;</span></a>
 <a><samp class=prompt>>>> </samp><kbd>print(humansize.approximate_size(4096, True))</kbd>  <span>&#x2461;</span></a>
@@ -161,7 +166,7 @@ if __name__ == "__main__":
     Returns: string
 
 </samp></pre>
-<ol>
+<ol id=skip-everything-is-an-object-screen>
 <li>The first line imports the <code>humansize</code> program as a module -- a chunk of code that you can use interactively, or from a larger Python program. (You'll see examples of multi-module Python programs in [FIXME xref].)  Once you import a module, you can reference any of its public functions, classes, or attributes. Modules can do this to access functionality in other modules, and you can do it in the Python interactive shell too. This is an important concept, and you'll see a lot more of it throughout this book.
 <li>When you want to use functions defined in imported modules, you need to include the module name. So you can't just say <code>approximate_size</code>; it must be <code>humansize.approximate_size</code>. If you've used classes in Java, this should feel vaguely familiar.
 <li>Instead of calling the function as you would expect to, you asked for one of the function's attributes, <code>__doc__</code>.
@@ -171,6 +176,7 @@ if __name__ == "__main__":
 </blockquote>
 <h3 id=importsearchpath>The <code>import</code> search path</h3>
 <p>Before this goes any further, I want to briefly mention the library search path. Python looks in several places when you try to import a module. Specifically, it looks in all the directories defined in <code>sys.path</code>. This is just a list, and you can easily view it or modify it with standard list methods. (You'll learn more about lists later in this chapter.)
+<p class=skip><a href=#skip-import-search-path-screen>skip over this interpreter listing</a>
 <pre class=screen>
 <a><samp class=prompt>>>> </samp><kbd>import sys</kbd>                       <span>&#x2460;</span></a>
 <a><samp class=prompt>>>> </samp><kbd>sys.path</kbd>                         <span>&#x2461;</span></a>
@@ -178,7 +184,7 @@ if __name__ == "__main__":
 <a><samp class=prompt>>>> </samp><kbd>sys</kbd>                              <span>&#x2462;</span></a>
 <samp>&lt;module 'sys' (built-in)></samp>
 <a><samp class=prompt>>>> </samp><kbd>sys.path.append('/my/new/path')</kbd>  <span>&#x2463;</span></a></pre>
-<ol>
+<ol id=skip-import-search-path-screen>
 <li>Importing the <code>sys</code> module makes all of its functions and attributes available.
 <li><code>sys.path</code> is a list of directory names that constitute the current search path. (Yours will look different, depending on your operating system, what version of Python you're running, and where it was originally installed.)  Python will look through these directories (in this order) for a <code>.py</code> file whose name matches what you're trying to import.
 <li>Actually, I lied; the truth is more complicated than that, because not all modules are stored as <code>.py</code> files. Some, like the <code>sys</code> module, are "built-in modules"; they are actually baked right into Python itself. Built-in modules behave just like regular modules, but their Python source code is not available, because they are not written in Python!  (The <code>sys</code> module is written in <abbr>C</abbr>.)
@@ -190,6 +196,7 @@ if __name__ == "__main__":
 <p>This is so important that I'm going to repeat it in case you missed it the first few times: <em>everything in Python is an object</em>. Strings are objects. Lists are objects. Functions are objects. Even modules are objects.
 <h2 id=indentingcode>Indenting code</h2>
 <p>Python functions have no explicit <code>begin</code> or <code>end</code>, and no curly braces to mark where the function code starts and stops. The only delimiter is a colon (<code>:</code>) and the indentation of the code itself.
+<p class=skip><a href=#skip-indenting-code>skip over this code listing</a>
 <pre><code>
 <a>def approximate_size(size, a_kilobyte_is_1024_bytes=True):  <span>&#x2460;</span></a>
 <a>    if size &lt; 0:                                            <span>&#x2461;</span></a>
@@ -202,7 +209,7 @@ if __name__ == "__main__":
             return "{0:.1f} {1}".format(size, suffix)
 
     raise ValueError('number too large')</code></pre>
-<ol>
+<ol id=skip-indenting-code>
 <li>Code blocks are defined by their indentation. By "code block," I mean functions, <code>if</code> statements, <code>for</code> loops, <code>while</code> loops, and so forth. Indenting starts a block and unindenting ends it. There are no explicit braces, brackets, or keywords. This means that whitespace is significant, and must be consistent. In this example, the function code is indented four spaces. It doesn't need to be four spaces, it just needs to be consistent. The first line that is not indented marks the end of the function.
 <li>In Python, an <code>if</code> statement is followed by a code block. If the <code>if</code> expression evaluates to true, the indented block is executed, otherwise it falls to the <code>else</code> block (if any). (Note the lack of parentheses around the expression.)
 <li>This line is inside the <code>if</code> code block. This <code>raise</code> statement will raise an exception (of type <code>ValueError</code>), but only if <code>size &lt; 0</code>.
@@ -215,19 +222,22 @@ if __name__ == "__main__":
 </blockquote>
 <h2 id=runningscripts>Running scripts</h2>
 <p>Python modules are objects and have several useful attributes. You can use this to easily test your modules as you write them, by including a special block of code that executes when you run the Python file on the command line. Take the last few lines of <code>humansize.py</code>:
+<p class=skip><a href=#skip-running-scripts>skip over this code listing</a>
 <pre><code>
 if __name__ == "__main__":
     print(approximate_size(1000000000000, False))
     print(approximate_size(1000000000000))</code></pre>
-<blockquote class="note compare clang">
+<blockquote class="note compare clang" id=skip-running-scripts>
 <p><span>&#x261E;</span>Like <abbr>C</abbr>, Python uses <code>==</code> for comparison and <code>=</code> for assignment. Unlike <abbr>C</abbr>, Python does not support in-line assignment, so there's no chance of accidentally assigning the value you thought you were comparing.
 </blockquote>
 <p>So what makes this <code>if</code> statement special?  Well, modules are objects, and all modules have a built-in attribute <code>__name__</code>. A module's <code>__name__</code> depends on how you're using the module. If you <code>import</code> the module, then <code>__name__</code> is the module's filename, without a directory path or file extension.
+<p class=skip><a href=#skip-import-humansize>skip over this interpreter listing</a>
 <pre class=screen>
 <samp class=prompt>>>> </samp><kbd>import humansize</kbd>
 <samp class=prompt>>>> </samp><kbd>humansize.__name__</kbd>
 <samp>'humansize'</samp></pre>
-<p>But you can also run the module directly as a standalone program, in which case <code>__name__</code> will be a special default value, <code>__main__</code>. Python will evaluate this <code>if</code> statement, find a true expression, and execute the <code>if</code> code block. In this case, to print two values.
+<p id=skip-import-humansize>But you can also run the module directly as a standalone program, in which case <code>__name__</code> will be a special default value, <code>__main__</code>. Python will evaluate this <code>if</code> statement, find a true expression, and execute the <code>if</code> code block. In this case, it prints two values.
+<p class=skip><a href=#furtherreading>skip over this command output listing</a>
 <pre class=screen>
 <samp class=prompt>c:\home\diveintopython3> </samp><kbd>c:\python30\python.exe humansize.py</kbd>
 <samp>1.0 TB